sigurdriseth committed on
Commit
2deb39e
·
verified ·
1 Parent(s): 2d66a80

Upload retrain-full joint intent+NER model

Browse files
encoder/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "BertModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": null,
8
+ "classifier_dropout": null,
9
+ "dtype": "float32",
10
+ "eos_token_id": null,
11
+ "gradient_checkpointing": false,
12
+ "hidden_act": "gelu",
13
+ "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 1024,
15
+ "initializer_range": 0.02,
16
+ "intermediate_size": 4096,
17
+ "is_decoder": false,
18
+ "layer_norm_eps": 1e-12,
19
+ "max_position_embeddings": 512,
20
+ "model_type": "bert",
21
+ "num_attention_heads": 16,
22
+ "num_hidden_layers": 24,
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "absolute",
25
+ "tie_word_embeddings": true,
26
+ "transformers_version": "5.1.0",
27
+ "type_vocab_size": 2,
28
+ "use_cache": true,
29
+ "vocab_size": 50000
30
+ }
encoder/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80cf0f07931d2f2a9587ceaba78b6a1cde1ee35c3be50d4a042d24cea6dc2613
3
+ size 1420394320
heads.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae3594808fed1a86bfaca39596352f6811f15badfca870a627068e9fb6ab1b9e
3
+ size 84361
joint_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "num_intents": 5,
3
+ "num_ner_labels": 15,
4
+ "intent_loss_weight": 0.6000000000000001,
5
+ "ner_loss_weight": 0.3999999999999999,
6
+ "classifier_dropout": null,
7
+ "hidden_size": 1024,
8
+ "hidden_dropout_prob": 0.1
9
+ }
label_config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "label2id": {
3
+ "O": 0,
4
+ "B-PRODUCT": 1,
5
+ "I-PRODUCT": 2,
6
+ "B-QUANTITY": 3,
7
+ "I-QUANTITY": 4,
8
+ "B-UNIT": 5,
9
+ "I-UNIT": 6,
10
+ "B-DELIVERY_METHOD": 7,
11
+ "I-DELIVERY_METHOD": 8,
12
+ "B-DELIVERY_DATE": 9,
13
+ "I-DELIVERY_DATE": 10,
14
+ "B-ADDRESS": 11,
15
+ "I-ADDRESS": 12,
16
+ "B-TANK_SILO": 13,
17
+ "I-TANK_SILO": 14
18
+ },
19
+ "id2label": {
20
+ "0": "O",
21
+ "1": "B-PRODUCT",
22
+ "2": "I-PRODUCT",
23
+ "3": "B-QUANTITY",
24
+ "4": "I-QUANTITY",
25
+ "5": "B-UNIT",
26
+ "6": "I-UNIT",
27
+ "7": "B-DELIVERY_METHOD",
28
+ "8": "I-DELIVERY_METHOD",
29
+ "9": "B-DELIVERY_DATE",
30
+ "10": "I-DELIVERY_DATE",
31
+ "11": "B-ADDRESS",
32
+ "12": "I-ADDRESS",
33
+ "13": "B-TANK_SILO",
34
+ "14": "I-TANK_SILO"
35
+ },
36
+ "intent2id": {
37
+ "create_order": 0,
38
+ "edit_order": 1,
39
+ "confirm": 2,
40
+ "reject": 3,
41
+ "help": 4
42
+ },
43
+ "id2intent": {
44
+ "0": "create_order",
45
+ "1": "edit_order",
46
+ "2": "confirm",
47
+ "3": "reject",
48
+ "4": "help"
49
+ }
50
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "cls_token": "[CLS]",
4
+ "do_basic_tokenize": true,
5
+ "do_lower_case": true,
6
+ "is_local": false,
7
+ "mask_token": "[MASK]",
8
+ "model_max_length": 1000000000000000019884624838656,
9
+ "never_split": null,
10
+ "pad_token": "[PAD]",
11
+ "sep_token": "[SEP]",
12
+ "strip_accents": false,
13
+ "tokenize_chinese_chars": true,
14
+ "tokenizer_class": "BertTokenizer",
15
+ "unk_token": "[UNK]"
16
+ }
training_results.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "retrain_full": true,
3
+ "train_size": 450,
4
+ "test_results": {
5
+ "eval_loss": 0.07978741824626923,
6
+ "eval_ner_precision": 0.9270833333333334,
7
+ "eval_ner_recall": 0.9518716577540107,
8
+ "eval_ner_f1": 0.9393139841688656,
9
+ "eval_intent_accuracy": 1.0,
10
+ "eval_intent_f1": 1.0,
11
+ "eval_f1": 0.9696569920844328,
12
+ "eval_runtime": 1.1246,
13
+ "eval_samples_per_second": 44.461,
14
+ "eval_steps_per_second": 6.225,
15
+ "epoch": 5.0
16
+ },
17
+ "best_hyperparameters": {
18
+ "learning_rate": 5e-05,
19
+ "num_train_epochs": 5,
20
+ "weight_decay": 0.01,
21
+ "per_device_train_batch_size": 8,
22
+ "warmup_ratio": 0.2,
23
+ "loss_alpha": 0.6000000000000001,
24
+ "freeze_layers": 0
25
+ }
26
+ }