samhitmantrala committed on
Commit
b84dabc
·
verified ·
1 Parent(s): 60e54d8

Training in progress, step 500

Browse files
config.json CHANGED
@@ -1,6 +1,5 @@
1
  {
2
- "_name_or_path": "distilgpt2",
3
- "_num_labels": 1,
4
  "activation_function": "gelu_new",
5
  "architectures": [
6
  "GPT2LMHeadModel"
@@ -9,20 +8,14 @@
9
  "bos_token_id": 50256,
10
  "embd_pdrop": 0.1,
11
  "eos_token_id": 50256,
12
- "id2label": {
13
- "0": "LABEL_0"
14
- },
15
  "initializer_range": 0.02,
16
- "label2id": {
17
- "LABEL_0": 0
18
- },
19
  "layer_norm_epsilon": 1e-05,
20
  "model_type": "gpt2",
21
  "n_ctx": 1024,
22
  "n_embd": 768,
23
  "n_head": 12,
24
  "n_inner": null,
25
- "n_layer": 6,
26
  "n_positions": 1024,
27
  "reorder_and_upcast_attn": false,
28
  "resid_pdrop": 0.1,
 
1
  {
2
+ "_name_or_path": "openai-community/gpt2",
 
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
8
  "bos_token_id": 50256,
9
  "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
 
 
 
11
  "initializer_range": 0.02,
 
 
 
12
  "layer_norm_epsilon": 1e-05,
13
  "model_type": "gpt2",
14
  "n_ctx": 1024,
15
  "n_embd": 768,
16
  "n_head": 12,
17
  "n_inner": null,
18
+ "n_layer": 12,
19
  "n_positions": 1024,
20
  "reorder_and_upcast_attn": false,
21
  "resid_pdrop": 0.1,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:116ef28be4964797bc1c3339ef72014d4a9a444554e2572f8f225a95329ef27f
3
- size 327657928
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:874f88027bcad1b34440d1386b9ef541db7d7d0182668caf4392255688502477
3
+ size 497774208
runs/Apr21_18-54-11_c8d33eca33e1/events.out.tfevents.1713725652.c8d33eca33e1.376.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61dd2a9fe4f065d66b9b7d6fb15ab4f943c5b8eb3acbd9dd170dd1bdfeeca55f
3
+ size 122139
runs/Apr21_18-56-06_c8d33eca33e1/events.out.tfevents.1713725767.c8d33eca33e1.376.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6b15050e8728f50bd5615ed9c09efbacf6241a6fd214815a32b8e6408aa4668
3
+ size 140205
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32e021e4ed1c911d0e31aef8e26c0015a37a24e3a7d3b05f2f388453ef311989
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8b2e0bb9a2bf0083af7ef391e9ada1b1721f5f48bc8105ec3b21e0f57fb2592
3
  size 4856