mgh6 committed on
Commit
4b2f862
·
verified ·
1 Parent(s): d1b1664

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "tattabio/gLM2_150M",
3
  "architectures": [
4
  "gLM2ForMaskedLM"
5
  ],
@@ -8,10 +8,10 @@
8
  "AutoModel": "modeling_glm2.gLM2Model",
9
  "AutoModelForMaskedLM": "modeling_glm2.gLM2ForMaskedLM"
10
  },
11
- "depth": 30,
12
- "dim": 640,
13
  "ffn_dim_multiplier": null,
14
- "heads": 10,
15
  "model_type": "gLM2",
16
  "norm_eps": 1e-05,
17
  "swiglu_multiple_of": 256,
 
1
  {
2
+ "_name_or_path": "tattabio/gLM2_650M",
3
  "architectures": [
4
  "gLM2ForMaskedLM"
5
  ],
 
8
  "AutoModel": "modeling_glm2.gLM2Model",
9
  "AutoModelForMaskedLM": "modeling_glm2.gLM2ForMaskedLM"
10
  },
11
+ "depth": 33,
12
+ "dim": 1280,
13
  "ffn_dim_multiplier": null,
14
+ "heads": 20,
15
  "model_type": "gLM2",
16
  "norm_eps": 1e-05,
17
  "swiglu_multiple_of": 256,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:516558ed7782de66fc542438abb1c93e159afd70a2aeb6571ce83cca423452b0
3
- size 609855088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:228e54ea153feeb0f49b0800638a29264ec8340106787699023f5720254dacea
3
+ size 2682482800
runs/Oct28_21-42-34_torch-flash-large-0-6/events.out.tfevents.1730151755.torch-flash-large-0-6.676.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12933faa94443b29d2eb1ec478a5f8fb657eeaa213446b52f73ac3d37515ce58
3
- size 5199
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78b89f24802dcc61b4b1b82401210bccab5382e28527bbc1714db989d559cb9b
3
+ size 5613
runs/Oct28_21-46-13_torch-flash-large-0-6/events.out.tfevents.1730151974.torch-flash-large-0-6.1973.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c6e229a6a8731a5e00d8f0f8ec017531cb925d84d382fe3317ef822ae0bf95
3
+ size 4790
runs/Oct28_22-05-01_torch-flash-large-0-6/events.out.tfevents.1730153103.torch-flash-large-0-6.10166.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6ff3b1ac941e1bcd457cea65251468dbd605703dfe609d70f448866fb997b48
3
+ size 5415
runs/Oct28_22-39-07_torch-flash-large-0-6/events.out.tfevents.1730155149.torch-flash-large-0-6.10310.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2c04de51840380e57c9b94c3f8a488270d5170f1e6c01dc1f198636bead3a90
3
+ size 6892
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:064b240ea07b11fb2a55256aa70c4f515e16a1e7de5972e80b77b98e19219a68
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b0a8ed667ee8b35f22ca4883f52af3ea1273c54ad954652c4052132affac051
3
  size 5240