Rogendo committed on
Commit
ecdeabd
·
verified ·
1 Parent(s): 7517e68

Upload JengaAI trained multi-task NLP model

Browse files
checkpoints/best/checkpoint_meta.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4,
3
+ "metrics": {
4
+ "fraud_detection_fraud_accuracy": 0.75,
5
+ "fraud_detection_fraud_precision": 0.875,
6
+ "fraud_detection_fraud_recall": 0.75,
7
+ "fraud_detection_fraud_f1": 0.7666666666666667,
8
+ "sentiment_analysis_sentiment_accuracy": 0.6666666666666666,
9
+ "sentiment_analysis_sentiment_precision": 0.8333333333333334,
10
+ "sentiment_analysis_sentiment_recall": 0.6666666666666666,
11
+ "sentiment_analysis_sentiment_f1": 0.6666666666666666,
12
+ "call_quality_opening_precision": 0.963,
13
+ "call_quality_opening_recall": 0.963,
14
+ "call_quality_opening_f1": 0.963,
15
+ "call_quality_listening_precision": 0.8913311928871326,
16
+ "call_quality_listening_recall": 0.9484888304862024,
17
+ "call_quality_listening_f1": 0.919022154316272,
18
+ "call_quality_proactiveness_precision": 0.7491271820448878,
19
+ "call_quality_proactiveness_recall": 0.8632183908045977,
20
+ "call_quality_proactiveness_f1": 0.8021361815754339,
21
+ "call_quality_resolution_precision": 0.9153363740022805,
22
+ "call_quality_resolution_recall": 0.8986845787853345,
23
+ "call_quality_resolution_f1": 0.9069340488631549,
24
+ "call_quality_hold_precision": 0.7804878048780488,
25
+ "call_quality_hold_recall": 0.46601941747572817,
26
+ "call_quality_hold_f1": 0.5835866261398176,
27
+ "call_quality_closing_precision": 0.863,
28
+ "call_quality_closing_recall": 0.863,
29
+ "call_quality_closing_f1": 0.863,
30
+ "eval_loss": 1.9891562443513138,
31
+ "train_loss_avg": 1.9425991174011004
32
+ },
33
+ "is_best": true
34
+ }
checkpoints/best/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f04c79105542cda3168410c549cfca104c566e5dd04c1c66496cfb38ccc0bd
3
+ size 450684151
checkpoints/epoch_8/checkpoint_meta.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 8,
3
+ "metrics": {
4
+ "fraud_detection_fraud_accuracy": 1.0,
5
+ "fraud_detection_fraud_precision": 1.0,
6
+ "fraud_detection_fraud_recall": 1.0,
7
+ "fraud_detection_fraud_f1": 1.0,
8
+ "sentiment_analysis_sentiment_accuracy": 0.6666666666666666,
9
+ "sentiment_analysis_sentiment_precision": 0.8333333333333334,
10
+ "sentiment_analysis_sentiment_recall": 0.6666666666666666,
11
+ "sentiment_analysis_sentiment_f1": 0.6666666666666666,
12
+ "call_quality_opening_precision": 0.961,
13
+ "call_quality_opening_recall": 0.961,
14
+ "call_quality_opening_f1": 0.961,
15
+ "call_quality_listening_precision": 0.8937638649248213,
16
+ "call_quality_listening_recall": 0.9529566360052563,
17
+ "call_quality_listening_f1": 0.9224116001017553,
18
+ "call_quality_proactiveness_precision": 0.7430112800392349,
19
+ "call_quality_proactiveness_recall": 0.8706896551724138,
20
+ "call_quality_proactiveness_f1": 0.8017994178354062,
21
+ "call_quality_resolution_precision": 0.9060665362035225,
22
+ "call_quality_resolution_recall": 0.9070808844108592,
23
+ "call_quality_resolution_f1": 0.9065734265734265,
24
+ "call_quality_hold_precision": 0.75177304964539,
25
+ "call_quality_hold_recall": 0.5145631067961165,
26
+ "call_quality_hold_f1": 0.6109510086455331,
27
+ "call_quality_closing_precision": 0.851,
28
+ "call_quality_closing_recall": 0.851,
29
+ "call_quality_closing_f1": 0.851,
30
+ "eval_loss": 2.139722445148688,
31
+ "train_loss_avg": 1.5664203519385957
32
+ },
33
+ "is_best": false
34
+ }
checkpoints/epoch_8/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53cd910936c79d638b139c62e284889edfb889b87ff170d7289fd91085855df4
3
+ size 450684151
checkpoints/epoch_9/checkpoint_meta.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 9,
3
+ "metrics": {
4
+ "fraud_detection_fraud_accuracy": 1.0,
5
+ "fraud_detection_fraud_precision": 1.0,
6
+ "fraud_detection_fraud_recall": 1.0,
7
+ "fraud_detection_fraud_f1": 1.0,
8
+ "sentiment_analysis_sentiment_accuracy": 0.6666666666666666,
9
+ "sentiment_analysis_sentiment_precision": 0.8333333333333334,
10
+ "sentiment_analysis_sentiment_recall": 0.6666666666666666,
11
+ "sentiment_analysis_sentiment_f1": 0.6666666666666666,
12
+ "call_quality_opening_precision": 0.963,
13
+ "call_quality_opening_recall": 0.963,
14
+ "call_quality_opening_f1": 0.963,
15
+ "call_quality_listening_precision": 0.8982245561390347,
16
+ "call_quality_listening_recall": 0.9440210249671485,
17
+ "call_quality_listening_f1": 0.920553562275756,
18
+ "call_quality_proactiveness_precision": 0.7580813347236705,
19
+ "call_quality_proactiveness_recall": 0.835632183908046,
20
+ "call_quality_proactiveness_f1": 0.7949699289229087,
21
+ "call_quality_resolution_precision": 0.9113707609005415,
22
+ "call_quality_resolution_recall": 0.8950461796809404,
23
+ "call_quality_resolution_f1": 0.9031347077096865,
24
+ "call_quality_hold_precision": 0.7575757575757576,
25
+ "call_quality_hold_recall": 0.4854368932038835,
26
+ "call_quality_hold_f1": 0.591715976331361,
27
+ "call_quality_closing_precision": 0.848,
28
+ "call_quality_closing_recall": 0.848,
29
+ "call_quality_closing_f1": 0.848,
30
+ "eval_loss": 2.179060117785747,
31
+ "train_loss_avg": 1.5035246791362407
32
+ },
33
+ "is_best": false
34
+ }
checkpoints/epoch_9/model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:debc0005634ff2b1e3728ced2194492c727ae1dfd1de9a52a8ae313c5fcf3b85
3
+ size 450684151
encoder_config/config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_cross_attention": false,
3
+ "architectures": [
4
+ "XLMRobertaForMaskedLM"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 0,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 2,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "is_decoder": false,
17
+ "layer_norm_eps": 1e-05,
18
+ "max_position_embeddings": 514,
19
+ "model_type": "xlm-roberta",
20
+ "num_attention_heads": 6,
21
+ "num_hidden_layers": 8,
22
+ "output_past": true,
23
+ "pad_token_id": 1,
24
+ "position_embedding_type": "absolute",
25
+ "tie_word_embeddings": true,
26
+ "transformers_version": "5.0.0",
27
+ "type_vocab_size": 1,
28
+ "use_cache": true,
29
+ "vocab_size": 70006
30
+ }
experiment_config.yaml ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ project_name: security_nlp_3task
2
+ tasks:
3
+ - name: fraud_detection
4
+ type: single_label_classification
5
+ data_path: fixtures/sample_classification.jsonl
6
+ heads:
7
+ - name: fraud
8
+ num_labels: 2
9
+ weight: 1.0
10
+ dropout: 0.1
11
+ text_column: text
12
+ label_column: label
13
+ label_maps: null
14
+ - name: sentiment_analysis
15
+ type: single_label_classification
16
+ data_path: fixtures/sample_sentiment.jsonl
17
+ heads:
18
+ - name: sentiment
19
+ num_labels: 3
20
+ weight: 1.0
21
+ dropout: 0.1
22
+ text_column: text
23
+ label_column: label
24
+ label_maps: null
25
+ - name: call_quality
26
+ type: question_answering
27
+ data_path: fixtures/synthetic_qa_metrics_data_v01x.json
28
+ heads:
29
+ - name: opening
30
+ num_labels: 1
31
+ weight: 1.0
32
+ dropout: 0.1
33
+ - name: listening
34
+ num_labels: 5
35
+ weight: 1.5
36
+ dropout: 0.1
37
+ - name: proactiveness
38
+ num_labels: 3
39
+ weight: 1.0
40
+ dropout: 0.1
41
+ - name: resolution
42
+ num_labels: 5
43
+ weight: 2.0
44
+ dropout: 0.1
45
+ - name: hold
46
+ num_labels: 2
47
+ weight: 0.5
48
+ dropout: 0.1
49
+ - name: closing
50
+ num_labels: 1
51
+ weight: 1.0
52
+ dropout: 0.1
53
+ text_column: transcript
54
+ label_column: labels
55
+ label_maps:
56
+ opening:
57
+ 0: greeting
58
+ listening:
59
+ 0: acknowledgment
60
+ 1: empathy
61
+ 2: clarification
62
+ 3: active_listening
63
+ 4: patience
64
+ proactiveness:
65
+ 0: initiative
66
+ 1: follow_up
67
+ 2: suggestions
68
+ resolution:
69
+ 0: identified_issue
70
+ 1: provided_solution
71
+ 2: confirmed_resolution
72
+ 3: set_expectations
73
+ 4: offered_alternatives
74
+ hold:
75
+ 0: asked_permission
76
+ 1: explained_reason
77
+ closing:
78
+ 0: proper_farewell
79
+ model:
80
+ base_model: castorini/afriberta_base
81
+ hidden_size: 768
82
+ dropout: 0.1
83
+ fusion:
84
+ type: attention
85
+ dropout: 0.1
86
+ use_residual: true
87
+ num_attention_heads: 1
88
+ gate_init_value: 0.5
89
+ freeze_encoder_layers: 0
90
+ gradient_checkpointing: false
91
+ tokenizer:
92
+ max_length: 256
93
+ padding: max_length
94
+ truncation: true
95
+ training:
96
+ output_dir: ./results/3task_fusion
97
+ learning_rate: 2.0e-05
98
+ batch_size: 16
99
+ eval_batch_size: 16
100
+ num_epochs: 12
101
+ weight_decay: 0.01
102
+ warmup_steps: 20
103
+ max_grad_norm: 1.0
104
+ gradient_accumulation_steps: 1
105
+ use_amp: false
106
+ device: auto
107
+ task_sampling: proportional
108
+ temperature: 2.0
109
+ early_stopping_patience: 5
110
+ metric_for_best_model: eval_loss
111
+ greater_is_better: false
112
+ logging:
113
+ service: tensorboard
114
+ experiment_name: security_3task_fusion
115
+ tracking_uri: null
116
+ log_every_n_steps: 5
117
+ checkpoint:
118
+ save_every_n_epochs: 1
119
+ save_best: true
120
+ max_checkpoints: 2
121
+ data:
122
+ test_size: 0.2
123
+ seed: 42
124
+ num_workers: 0
125
+ pin_memory: true
126
+ pii_redaction:
127
+ enabled: false
128
+ strategy: mask
129
+ detect_types: null
130
+ hash_salt: jenga-ai-pii
131
+ log_detections: true
logs/security_3task_fusion/events.out.tfevents.1771217131.7207cada2386.3311.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bf8c2b49a191f57676c7419cc02f6bc4f91c9f07c53762ed936e5bcf502144e
3
+ size 44553
metadata.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_model": "castorini/afriberta_base",
3
+ "hidden_size": 768,
4
+ "num_tasks": 3,
5
+ "task_names": [
6
+ "fraud_detection",
7
+ "sentiment_analysis",
8
+ "call_quality"
9
+ ],
10
+ "task_types": [
11
+ "single_label_classification",
12
+ "single_label_classification",
13
+ "question_answering"
14
+ ],
15
+ "has_fusion": true
16
+ }
model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:debc0005634ff2b1e3728ced2194492c727ae1dfd1de9a52a8ae313c5fcf3b85
3
+ size 450684151