# JengaAI-multi-task-roberta-base / experiment_config.yaml
# Uploaded by Rogendo: "Upload JengaAI trained multi-task NLP model"
# (commit c838fec, verified)
# Name given to this experiment/project (how the loader uses it is not visible here).
project_name: security_nlp_3task
# Task definitions for this experiment. Each task entry lists its type, data
# file, one or more heads, the text/label column names, and optional label maps.
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been flattened — confirm against the loader's schema.
tasks:
  - name: fraud_detection
    type: single_label_classification
    data_path: fixtures/sample_classification.jsonl
    heads:
      - name: fraud
        num_labels: 2
        weight: 1.0
        dropout: 0.1
    text_column: text
    label_column: label
    label_maps: null

  - name: sentiment_analysis
    type: single_label_classification
    data_path: fixtures/sample_sentiment.jsonl
    heads:
      - name: sentiment
        num_labels: 3
        weight: 1.0
        dropout: 0.1
    text_column: text
    label_column: label
    label_maps: null

  - name: call_quality
    type: question_answering
    # NOTE(review): absolute path, unlike the relative fixtures/ paths used by
    # the other tasks — confirm it resolves outside the original environment.
    data_path: /content/JengaAI/fixtures/synthetic_qa_metrics_data_v01x.json
    # Six heads; `weight` differs per head (0.5 to 2.0).
    heads:
      - name: opening
        num_labels: 1
        weight: 1.0
        dropout: 0.1
      - name: listening
        num_labels: 5
        weight: 1.5
        dropout: 0.1
      - name: proactiveness
        num_labels: 3
        weight: 1.0
        dropout: 0.1
      - name: resolution
        num_labels: 5
        weight: 2.0
        dropout: 0.1
      - name: hold
        num_labels: 2
        weight: 0.5
        dropout: 0.1
      - name: closing
        num_labels: 1
        weight: 1.0
        dropout: 0.1
    text_column: transcript
    label_column: labels
    # One map per head above, keyed by head name; each map goes from integer
    # index to label name and has as many entries as that head's num_labels.
    label_maps:
      opening:
        0: greeting
      listening:
        0: acknowledgment
        1: empathy
        2: clarification
        3: active_listening
        4: patience
      proactiveness:
        0: initiative
        1: follow_up
        2: suggestions
      resolution:
        0: identified_issue
        1: provided_solution
        2: confirmed_resolution
        3: set_expectations
        4: offered_alternatives
      hold:
        0: asked_permission
        1: explained_reason
      closing:
        0: proper_farewell
# Model settings: base checkpoint name, hidden size, dropout, and a nested
# `fusion` section.
# NOTE(review): indentation was reconstructed from a flattened copy. The second
# `dropout` has to live under `fusion` (it would otherwise duplicate the
# model-level key). Placing `freeze_encoder_layers` and
# `gradient_checkpointing` at model level rather than under `fusion` is an
# assumption — confirm against the loader's schema.
model:
  base_model: roberta-base
  hidden_size: 768
  dropout: 0.1
  fusion:
    type: attention
    dropout: 0.1
    use_residual: true
    num_attention_heads: 1
    gate_init_value: 0.5
  freeze_encoder_layers: 0
  gradient_checkpointing: false
# Tokenizer settings: maximum sequence length, padding mode and truncation flag.
# NOTE(review): child keys re-indented under the section header; the header is
# kept at top level as it appears in the flattened copy — confirm.
tokenizer:
  max_length: 256
  padding: max_length
  truncation: true
# Training settings: output location, optimiser hyper-parameters, task sampling,
# early stopping and best-model selection, followed by logging, checkpoint and
# data sub-sections.
# NOTE(review): indentation was reconstructed from a flattened copy. Nesting
# `logging`, `checkpoint` and `data` under `training` is an assumption (they
# directly follow the training keys) — if the loader expects them as top-level
# sections, dedent them. Confirm against the loader's schema.
training:
  output_dir: ./results/roberta-base-3task_fusion
  learning_rate: 2.0e-05
  batch_size: 8
  eval_batch_size: 8
  num_epochs: 15
  weight_decay: 0.01
  warmup_steps: 20
  max_grad_norm: 1.0
  gradient_accumulation_steps: 1
  use_amp: false
  device: auto
  task_sampling: proportional
  temperature: 2.0
  early_stopping_patience: 5
  # Best model is chosen on eval_loss; greater_is_better is false for it.
  metric_for_best_model: eval_loss
  greater_is_better: false

  logging:
    service: tensorboard
    experiment_name: security_3task_fusion
    tracking_uri: null
    log_every_n_steps: 5

  checkpoint:
    save_every_n_epochs: 1
    save_best: true
    max_checkpoints: 2

  data:
    test_size: 0.2
    seed: 42
    num_workers: 0
    pin_memory: true
# PII redaction settings; redaction is switched off here (enabled: false).
# NOTE(review): child keys re-indented under the section header; the header is
# kept at top level as it appears in the flattened copy — confirm it is not
# expected under another section (e.g. `data` or `training`).
# NOTE(review): hash_salt is a fixed literal stored in this file — if redaction
# is ever enabled with a hashing strategy, consider supplying it externally.
pii_redaction:
  enabled: false
  strategy: mask
  detect_types: null
  hash_salt: jenga-ai-pii
  log_detections: true