Sayan01 committed on
Commit
23c5701
·
verified ·
1 Parent(s): f15dc77

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -4,22 +4,22 @@
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
- "gradient_checkpointing": false,
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
- "hidden_size": 512,
11
  "initializer_range": 0.02,
12
- "intermediate_size": 3072,
13
  "layer_norm_eps": 1e-12,
14
  "max_position_embeddings": 512,
15
  "model_type": "bert",
16
- "num_attention_heads": 8,
17
- "num_hidden_layers": 6,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
- "transformers_version": "4.39.0",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
  "vocab_size": 30522
 
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "classifier_dropout": null,
7
+ "finetuning_task": "sst-2",
8
  "hidden_act": "gelu",
9
  "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 384,
11
  "initializer_range": 0.02,
12
+ "intermediate_size": 1536,
13
  "layer_norm_eps": 1e-12,
14
  "max_position_embeddings": 512,
15
  "model_type": "bert",
16
+ "num_attention_heads": 12,
17
+ "num_hidden_layers": 12,
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
  "problem_type": "single_label_classification",
21
  "torch_dtype": "float32",
22
+ "transformers_version": "4.45.1",
23
  "type_vocab_size": 2,
24
  "use_cache": true,
25
  "vocab_size": 30522
logs/events.out.tfevents.1724851568.spartan-gpgpu092.hpc.unimelb.edu.au.199860.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9359702a996c844d6c46dd032a5f124c1147b57cb8ddec1e4d553877efa8d365
3
- size 9676
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59202bd1e2613b5c4045bec454073c823d9d54c998b90cd31c3870980abe2abf
3
+ size 10564
logs/events.out.tfevents.1724858283.spartan-gpgpu092.hpc.unimelb.edu.au.199860.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3874a420149c000f319fae4bad3c10771152f3d14f8e998d11785418021117c6
3
+ size 411
logs/events.out.tfevents.1727725862.spartan-gpgpu147.hpc.unimelb.edu.au.116319.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0fd0b228c22a7a43270a2cb446db9ce8c4f74ee47bd1f2ff3eb8554f6a099f1
3
+ size 5883
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82502dc56b28ee4f27771bcb019a138d21af8077d5bec2401c4606a45f42e6c8
3
- size 165480304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:774647636b32119027595bedb091b007018818ba37d511dfe7b458c9e69fb769
3
+ size 133466376
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 512,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 512
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 0,
16
+ "pad_type_id": 0,
17
+ "pad_token": "[PAD]"
18
+ },
19
  "added_tokens": [
20
  {
21
  "id": 0,
tokenizer_config.json CHANGED
@@ -41,7 +41,7 @@
41
  "special": true
42
  }
43
  },
44
- "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
 
41
  "special": true
42
  }
43
  },
44
+ "clean_up_tokenization_spaces": false,
45
  "cls_token": "[CLS]",
46
  "do_lower_case": true,
47
  "mask_token": "[MASK]",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba0abb8edd82c8779b2624d5a123b8ca8ce20afd1ccf9de599e3b613e2b7bf17
3
- size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46eeb5538a0185c2eff2f2b2a73333f17eccb4c40fe9c55defa4d1c6b0ead6f4
3
+ size 5304