sheoran95 commited on
Commit
03c395b
·
1 Parent(s): f8c36cd

Training in progress, step 500

Browse files
added_tokens.json CHANGED
@@ -12,15 +12,5 @@
12
  ":ARGM-MNR": 32108,
13
  ":ARGM-NEG": 32113,
14
  ":ARGM-PRP": 32109,
15
- ":ARGM-TMP": 32107,
16
- ":graph1": 32114,
17
- ":graph10": 32123,
18
- ":graph2": 32115,
19
- ":graph3": 32116,
20
- ":graph4": 32117,
21
- ":graph5": 32118,
22
- ":graph6": 32119,
23
- ":graph7": 32120,
24
- ":graph8": 32121,
25
- ":graph9": 32122
26
  }
 
12
  ":ARGM-MNR": 32108,
13
  ":ARGM-NEG": 32113,
14
  ":ARGM-PRP": 32109,
15
+ ":ARGM-TMP": 32107
 
 
 
 
 
 
 
 
 
 
16
  }
config.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
- "_name_or_path": "t5-small",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
6
- "d_ff": 2048,
7
  "d_kv": 64,
8
- "d_model": 512,
9
  "decoder_start_token_id": 0,
10
  "dense_act_fn": "relu",
11
  "dropout_rate": 0.1,
@@ -17,9 +17,9 @@
17
  "layer_norm_epsilon": 1e-06,
18
  "model_type": "t5",
19
  "n_positions": 512,
20
- "num_decoder_layers": 6,
21
- "num_heads": 8,
22
- "num_layers": 6,
23
  "output_past": true,
24
  "pad_token_id": 0,
25
  "relative_attention_max_distance": 128,
@@ -54,7 +54,7 @@
54
  }
55
  },
56
  "torch_dtype": "float32",
57
- "transformers_version": "4.26.1",
58
  "use_cache": true,
59
- "vocab_size": 32124
60
  }
 
1
  {
2
+ "_name_or_path": "t5-large",
3
  "architectures": [
4
  "T5ForConditionalGeneration"
5
  ],
6
+ "d_ff": 4096,
7
  "d_kv": 64,
8
+ "d_model": 1024,
9
  "decoder_start_token_id": 0,
10
  "dense_act_fn": "relu",
11
  "dropout_rate": 0.1,
 
17
  "layer_norm_epsilon": 1e-06,
18
  "model_type": "t5",
19
  "n_positions": 512,
20
+ "num_decoder_layers": 24,
21
+ "num_heads": 16,
22
+ "num_layers": 24,
23
  "output_past": true,
24
  "pad_token_id": 0,
25
  "relative_attention_max_distance": 128,
 
54
  }
55
  },
56
  "torch_dtype": "float32",
57
+ "transformers_version": "4.27.3",
58
  "use_cache": true,
59
+ "vocab_size": 32114
60
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e974ce2a7ef3ca156a0d1a53de155fb1888878d2b50f8c85023f36f9ec6d737
3
- size 242063449
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e03d92b495880b29acf2dd0169c643fa8d587d387644233cf69c35317c3f6728
3
+ size 2950791169
runs/Mar28_11-55-35_d5f806247e8b/1680004539.0123274/events.out.tfevents.1680004539.d5f806247e8b.17127.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3905897a2e5a058794a58beedbb7cb33019bc193b3ad7e22e7dbc995a6f29c82
3
+ size 5981
runs/Mar28_11-55-35_d5f806247e8b/events.out.tfevents.1680004538.d5f806247e8b.17127.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f911b8b5b60d6b65c5e03373723c63b2fa08ac902a503485357b21e4b56f8554
3
+ size 4976
special_tokens_map.json CHANGED
@@ -13,17 +13,7 @@
13
  ":ARGM-CAU",
14
  ":ARGM-DIR",
15
  ":ARGM-EXT",
16
- ":ARGM-NEG",
17
- ":graph1",
18
- ":graph2",
19
- ":graph3",
20
- ":graph4",
21
- ":graph5",
22
- ":graph6",
23
- ":graph7",
24
- ":graph8",
25
- ":graph9",
26
- ":graph10"
27
  ],
28
  "eos_token": "</s>",
29
  "pad_token": "<pad>",
 
13
  ":ARGM-CAU",
14
  ":ARGM-DIR",
15
  ":ARGM-EXT",
16
+ ":ARGM-NEG"
 
 
 
 
 
 
 
 
 
 
17
  ],
18
  "eos_token": "</s>",
19
  "pad_token": "<pad>",
tokenizer.json CHANGED
@@ -1067,96 +1067,6 @@
1067
  "rstrip": false,
1068
  "normalized": false,
1069
  "special": true
1070
- },
1071
- {
1072
- "id": 32114,
1073
- "content": ":graph1",
1074
- "single_word": false,
1075
- "lstrip": false,
1076
- "rstrip": false,
1077
- "normalized": false,
1078
- "special": true
1079
- },
1080
- {
1081
- "id": 32115,
1082
- "content": ":graph2",
1083
- "single_word": false,
1084
- "lstrip": false,
1085
- "rstrip": false,
1086
- "normalized": false,
1087
- "special": true
1088
- },
1089
- {
1090
- "id": 32116,
1091
- "content": ":graph3",
1092
- "single_word": false,
1093
- "lstrip": false,
1094
- "rstrip": false,
1095
- "normalized": false,
1096
- "special": true
1097
- },
1098
- {
1099
- "id": 32117,
1100
- "content": ":graph4",
1101
- "single_word": false,
1102
- "lstrip": false,
1103
- "rstrip": false,
1104
- "normalized": false,
1105
- "special": true
1106
- },
1107
- {
1108
- "id": 32118,
1109
- "content": ":graph5",
1110
- "single_word": false,
1111
- "lstrip": false,
1112
- "rstrip": false,
1113
- "normalized": false,
1114
- "special": true
1115
- },
1116
- {
1117
- "id": 32119,
1118
- "content": ":graph6",
1119
- "single_word": false,
1120
- "lstrip": false,
1121
- "rstrip": false,
1122
- "normalized": false,
1123
- "special": true
1124
- },
1125
- {
1126
- "id": 32120,
1127
- "content": ":graph7",
1128
- "single_word": false,
1129
- "lstrip": false,
1130
- "rstrip": false,
1131
- "normalized": false,
1132
- "special": true
1133
- },
1134
- {
1135
- "id": 32121,
1136
- "content": ":graph8",
1137
- "single_word": false,
1138
- "lstrip": false,
1139
- "rstrip": false,
1140
- "normalized": false,
1141
- "special": true
1142
- },
1143
- {
1144
- "id": 32122,
1145
- "content": ":graph9",
1146
- "single_word": false,
1147
- "lstrip": false,
1148
- "rstrip": false,
1149
- "normalized": false,
1150
- "special": true
1151
- },
1152
- {
1153
- "id": 32123,
1154
- "content": ":graph10",
1155
- "single_word": false,
1156
- "lstrip": false,
1157
- "rstrip": false,
1158
- "normalized": false,
1159
- "special": true
1160
  }
1161
  ],
1162
  "normalizer": {
 
1067
  "rstrip": false,
1068
  "normalized": false,
1069
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1070
  }
1071
  ],
1072
  "normalizer": {
tokenizer_config.json CHANGED
@@ -104,7 +104,6 @@
104
  "eos_token": "</s>",
105
  "extra_ids": 100,
106
  "model_max_length": 512,
107
- "name_or_path": "t5-small",
108
  "pad_token": "<pad>",
109
  "special_tokens_map_file": null,
110
  "tokenizer_class": "T5Tokenizer",
 
104
  "eos_token": "</s>",
105
  "extra_ids": 100,
106
  "model_max_length": 512,
 
107
  "pad_token": "<pad>",
108
  "special_tokens_map_file": null,
109
  "tokenizer_class": "T5Tokenizer",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a30bd09f4afc5c21d55974f45dcdf6d0bc7c83e942122064a692247db45e17d0
3
- size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e4675273a31e5eebae2b1b2c3989e5c7676ef6477893030095707614a5e8872
3
+ size 3707