Training in progress, epoch 1
Browse files
config.json
CHANGED
|
@@ -12,142 +12,142 @@
|
|
| 12 |
"hidden_dropout_prob": 0.0,
|
| 13 |
"hidden_size": 1024,
|
| 14 |
"id2label": {
|
| 15 |
-
"0": "
|
| 16 |
-
"1": "
|
| 17 |
-
"2": "
|
| 18 |
-
"3": "
|
| 19 |
-
"4": "
|
| 20 |
-
"5": "
|
| 21 |
-
"6": "
|
| 22 |
-
"7": "
|
| 23 |
-
"8": "
|
| 24 |
-
"9": "
|
| 25 |
-
"10": "
|
| 26 |
-
"11": "
|
| 27 |
-
"12": "
|
| 28 |
-
"13": "
|
| 29 |
-
"14": "
|
| 30 |
-
"15": "
|
| 31 |
-
"16": "
|
| 32 |
-
"17": "
|
| 33 |
-
"18": "
|
| 34 |
-
"19": "
|
| 35 |
-
"20": "
|
| 36 |
-
"21": "
|
| 37 |
-
"22": "
|
| 38 |
-
"23": "
|
| 39 |
-
"24": "
|
| 40 |
-
"25": "
|
| 41 |
-
"26": "
|
| 42 |
-
"27": "
|
| 43 |
-
"28": "
|
| 44 |
-
"29": "
|
| 45 |
-
"30": "
|
| 46 |
-
"31": "
|
| 47 |
-
"32": "
|
| 48 |
-
"33": "
|
| 49 |
-
"34": "
|
| 50 |
-
"35": "
|
| 51 |
-
"36": "
|
| 52 |
-
"37": "
|
| 53 |
-
"38": "
|
| 54 |
-
"39": "
|
| 55 |
-
"40": "
|
| 56 |
-
"41": "
|
| 57 |
-
"42": "
|
| 58 |
-
"43": "
|
| 59 |
-
"44": "
|
| 60 |
-
"45": "
|
| 61 |
-
"46": "
|
| 62 |
-
"47": "
|
| 63 |
-
"48": "
|
| 64 |
-
"49": "
|
| 65 |
-
"50": "
|
| 66 |
-
"51": "
|
| 67 |
-
"52": "
|
| 68 |
-
"53": "
|
| 69 |
-
"54": "
|
| 70 |
-
"55": "
|
| 71 |
-
"56": "
|
| 72 |
"57": "Fg",
|
| 73 |
-
"58": "
|
| 74 |
-
"59": "
|
| 75 |
-
"60": "
|
| 76 |
-
"61": "
|
| 77 |
-
"62": "
|
| 78 |
-
"63": "
|
| 79 |
-
"64": "
|
| 80 |
"65": "cs"
|
| 81 |
},
|
| 82 |
"initializer_range": 0.02,
|
| 83 |
"intermediate_size": 4096,
|
| 84 |
"label2id": {
|
| 85 |
-
"Faa":
|
| 86 |
-
"Fat":
|
| 87 |
-
"Fc":
|
| 88 |
-
"Fd":
|
| 89 |
-
"Fe":
|
| 90 |
"Fg": 57,
|
| 91 |
-
"Fh":
|
| 92 |
-
"Fia":
|
| 93 |
-
"Fit":
|
| 94 |
-
"Fp":
|
| 95 |
-
"Fpa":
|
| 96 |
-
"Fpt":
|
| 97 |
-
"Fs":
|
| 98 |
-
"Fx":
|
| 99 |
-
"Fz":
|
| 100 |
-
"I":
|
| 101 |
-
"W":
|
| 102 |
-
"X":
|
| 103 |
-
"Y":
|
| 104 |
-
"Z":
|
| 105 |
-
"Zm":
|
| 106 |
-
"Zp":
|
| 107 |
-
"ao":
|
| 108 |
-
"aq":
|
| 109 |
-
"cc":
|
| 110 |
"cs": 65,
|
| 111 |
-
"da":
|
| 112 |
-
"dd":
|
| 113 |
-
"de":
|
| 114 |
-
"di":
|
| 115 |
-
"dn":
|
| 116 |
-
"dp":
|
| 117 |
-
"dt":
|
| 118 |
-
"i":
|
| 119 |
-
"nc":
|
| 120 |
-
"np":
|
| 121 |
-
"p0":
|
| 122 |
-
"pd":
|
| 123 |
-
"pe":
|
| 124 |
-
"pi":
|
| 125 |
-
"pn":
|
| 126 |
-
"pp":
|
| 127 |
-
"pr":
|
| 128 |
-
"pt":
|
| 129 |
-
"px":
|
| 130 |
-
"rg":
|
| 131 |
-
"rn":
|
| 132 |
-
"sp":
|
| 133 |
-
"vag":
|
| 134 |
-
"vai":
|
| 135 |
-
"vam":
|
| 136 |
-
"van":
|
| 137 |
-
"vap":
|
| 138 |
-
"vas":
|
| 139 |
-
"vmg":
|
| 140 |
-
"vmi":
|
| 141 |
-
"vmm":
|
| 142 |
-
"vmn":
|
| 143 |
-
"vmp":
|
| 144 |
-
"vms":
|
| 145 |
-
"vsg":
|
| 146 |
-
"vsi":
|
| 147 |
-
"vsm":
|
| 148 |
-
"vsn":
|
| 149 |
-
"vsp":
|
| 150 |
-
"vss":
|
| 151 |
},
|
| 152 |
"layer_norm_eps": 1e-05,
|
| 153 |
"max_position_embeddings": 514,
|
|
|
|
| 12 |
"hidden_dropout_prob": 0.0,
|
| 13 |
"hidden_size": 1024,
|
| 14 |
"id2label": {
|
| 15 |
+
"0": "dp",
|
| 16 |
+
"1": "px",
|
| 17 |
+
"2": "nc",
|
| 18 |
+
"3": "vsn",
|
| 19 |
+
"4": "pn",
|
| 20 |
+
"5": "Fia",
|
| 21 |
+
"6": "vag",
|
| 22 |
+
"7": "dt",
|
| 23 |
+
"8": "Zm",
|
| 24 |
+
"9": "p0",
|
| 25 |
+
"10": "aq",
|
| 26 |
+
"11": "vmn",
|
| 27 |
+
"12": "da",
|
| 28 |
+
"13": "Fz",
|
| 29 |
+
"14": "rn",
|
| 30 |
+
"15": "Fs",
|
| 31 |
+
"16": "Fp",
|
| 32 |
+
"17": "Fh",
|
| 33 |
+
"18": "vsi",
|
| 34 |
+
"19": "pe",
|
| 35 |
+
"20": "vas",
|
| 36 |
+
"21": "vap",
|
| 37 |
+
"22": "pi",
|
| 38 |
+
"23": "Y",
|
| 39 |
+
"24": "Fe",
|
| 40 |
+
"25": "de",
|
| 41 |
+
"26": "pd",
|
| 42 |
+
"27": "pp",
|
| 43 |
+
"28": "i",
|
| 44 |
+
"29": "X",
|
| 45 |
+
"30": "cc",
|
| 46 |
+
"31": "dn",
|
| 47 |
+
"32": "Fit",
|
| 48 |
+
"33": "I",
|
| 49 |
+
"34": "ao",
|
| 50 |
+
"35": "vai",
|
| 51 |
+
"36": "Fx",
|
| 52 |
+
"37": "vms",
|
| 53 |
+
"38": "sp",
|
| 54 |
+
"39": "Fpa",
|
| 55 |
+
"40": "Fpt",
|
| 56 |
+
"41": "vmg",
|
| 57 |
+
"42": "di",
|
| 58 |
+
"43": "vsp",
|
| 59 |
+
"44": "pt",
|
| 60 |
+
"45": "vsg",
|
| 61 |
+
"46": "dd",
|
| 62 |
+
"47": "Fat",
|
| 63 |
+
"48": "rg",
|
| 64 |
+
"49": "vss",
|
| 65 |
+
"50": "Faa",
|
| 66 |
+
"51": "vsm",
|
| 67 |
+
"52": "np",
|
| 68 |
+
"53": "W",
|
| 69 |
+
"54": "vmi",
|
| 70 |
+
"55": "vmp",
|
| 71 |
+
"56": "van",
|
| 72 |
"57": "Fg",
|
| 73 |
+
"58": "vam",
|
| 74 |
+
"59": "pr",
|
| 75 |
+
"60": "Fd",
|
| 76 |
+
"61": "Z",
|
| 77 |
+
"62": "vmm",
|
| 78 |
+
"63": "Fc",
|
| 79 |
+
"64": "Zp",
|
| 80 |
"65": "cs"
|
| 81 |
},
|
| 82 |
"initializer_range": 0.02,
|
| 83 |
"intermediate_size": 4096,
|
| 84 |
"label2id": {
|
| 85 |
+
"Faa": 50,
|
| 86 |
+
"Fat": 47,
|
| 87 |
+
"Fc": 63,
|
| 88 |
+
"Fd": 60,
|
| 89 |
+
"Fe": 24,
|
| 90 |
"Fg": 57,
|
| 91 |
+
"Fh": 17,
|
| 92 |
+
"Fia": 5,
|
| 93 |
+
"Fit": 32,
|
| 94 |
+
"Fp": 16,
|
| 95 |
+
"Fpa": 39,
|
| 96 |
+
"Fpt": 40,
|
| 97 |
+
"Fs": 15,
|
| 98 |
+
"Fx": 36,
|
| 99 |
+
"Fz": 13,
|
| 100 |
+
"I": 33,
|
| 101 |
+
"W": 53,
|
| 102 |
+
"X": 29,
|
| 103 |
+
"Y": 23,
|
| 104 |
+
"Z": 61,
|
| 105 |
+
"Zm": 8,
|
| 106 |
+
"Zp": 64,
|
| 107 |
+
"ao": 34,
|
| 108 |
+
"aq": 10,
|
| 109 |
+
"cc": 30,
|
| 110 |
"cs": 65,
|
| 111 |
+
"da": 12,
|
| 112 |
+
"dd": 46,
|
| 113 |
+
"de": 25,
|
| 114 |
+
"di": 42,
|
| 115 |
+
"dn": 31,
|
| 116 |
+
"dp": 0,
|
| 117 |
+
"dt": 7,
|
| 118 |
+
"i": 28,
|
| 119 |
+
"nc": 2,
|
| 120 |
+
"np": 52,
|
| 121 |
+
"p0": 9,
|
| 122 |
+
"pd": 26,
|
| 123 |
+
"pe": 19,
|
| 124 |
+
"pi": 22,
|
| 125 |
+
"pn": 4,
|
| 126 |
+
"pp": 27,
|
| 127 |
+
"pr": 59,
|
| 128 |
+
"pt": 44,
|
| 129 |
+
"px": 1,
|
| 130 |
+
"rg": 48,
|
| 131 |
+
"rn": 14,
|
| 132 |
+
"sp": 38,
|
| 133 |
+
"vag": 6,
|
| 134 |
+
"vai": 35,
|
| 135 |
+
"vam": 58,
|
| 136 |
+
"van": 56,
|
| 137 |
+
"vap": 21,
|
| 138 |
+
"vas": 20,
|
| 139 |
+
"vmg": 41,
|
| 140 |
+
"vmi": 54,
|
| 141 |
+
"vmm": 62,
|
| 142 |
+
"vmn": 11,
|
| 143 |
+
"vmp": 55,
|
| 144 |
+
"vms": 37,
|
| 145 |
+
"vsg": 45,
|
| 146 |
+
"vsi": 18,
|
| 147 |
+
"vsm": 51,
|
| 148 |
+
"vsn": 3,
|
| 149 |
+
"vsp": 43,
|
| 150 |
+
"vss": 49
|
| 151 |
},
|
| 152 |
"layer_norm_eps": 1e-05,
|
| 153 |
"max_position_embeddings": 514,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1417546912
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9311b9985276a9ee8b8b9643d1394b302fff2c1494a37bb1527edb2dee349d57
|
| 3 |
size 1417546912
|
runs/Oct28_10-19-38_4226ec852e37/events.out.tfevents.1730111007.4226ec852e37.2246.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8166dbd052f4bd5a3569aa96f8536ef7d56a710eac864c741912fe8095f28d4
|
| 3 |
+
size 7695
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f064f264b058c74e3bd19a1438b44b6ab5de5bd0291439354e72b5a86d525b3
|
| 3 |
size 5176
|