mgh6 committed on
Commit
b0a5dcb
·
verified ·
1 Parent(s): 3305d70

Training in progress, step 2

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "tattabio/gLM2_650M",
3
  "architectures": [
4
  "gLM2ForMaskedLM"
5
  ],
@@ -8,14 +8,14 @@
8
  "AutoModel": "modeling_glm2.gLM2Model",
9
  "AutoModelForMaskedLM": "modeling_glm2.gLM2ForMaskedLM"
10
  },
11
- "depth": 33,
12
- "dim": 1280,
13
  "ffn_dim_multiplier": null,
14
- "heads": 20,
15
  "model_type": "gLM2",
16
  "norm_eps": 1e-05,
17
  "swiglu_multiple_of": 256,
18
  "torch_dtype": "float32",
19
- "transformers_version": "4.45.2",
20
  "vocab_size": 37
21
  }
 
1
  {
2
+ "_name_or_path": "tattabio/gLM2_150M",
3
  "architectures": [
4
  "gLM2ForMaskedLM"
5
  ],
 
8
  "AutoModel": "modeling_glm2.gLM2Model",
9
  "AutoModelForMaskedLM": "modeling_glm2.gLM2ForMaskedLM"
10
  },
11
+ "depth": 30,
12
+ "dim": 640,
13
  "ffn_dim_multiplier": null,
14
+ "heads": 10,
15
  "model_type": "gLM2",
16
  "norm_eps": 1e-05,
17
  "swiglu_multiple_of": 256,
18
  "torch_dtype": "float32",
19
+ "transformers_version": "4.46.0",
20
  "vocab_size": 37
21
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9eae45eb43651c4ce612c5b264270a3ccdfbc48e1be2784320e0059c614c3cab
3
- size 2682482800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:516558ed7782de66fc542438abb1c93e159afd70a2aeb6571ce83cca423452b0
3
+ size 609855088
runs/Oct22_14-42-35_torch-flash-large-0-5/events.out.tfevents.1729608158.torch-flash-large-0-5.15432.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:810807ab17e17d607934b36f382c07db6fdce6404d6609316f2cc595fe0b50b5
3
- size 30034
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:795897e579db5094733b5e6a833553202120ad6e7282eb13a24e0a23837fd9dd
3
+ size 31933
runs/Oct28_21-42-34_torch-flash-large-0-6/events.out.tfevents.1730151755.torch-flash-large-0-6.676.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12933faa94443b29d2eb1ec478a5f8fb657eeaa213446b52f73ac3d37515ce58
3
+ size 5199
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65de12ccf65227e16c5ac7d6f4de8c23b93867370e90dd502a95ed85503923fb
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:064b240ea07b11fb2a55256aa70c4f515e16a1e7de5972e80b77b98e19219a68
3
  size 5240