---
# Multi-task training configuration: 3 tasks (fraud detection, sentiment
# analysis, call-quality QA scoring) sharing one roberta-base encoder with
# attention fusion. Reconstructed indentation — the source paste had lost all
# nesting; stanza grouping below follows the evident schema.
project_name: security_nlp_3task

tasks:
  # Task 1: binary fraud classification on sample fixture data.
  - name: fraud_detection
    type: single_label_classification
    data_path: fixtures/sample_classification.jsonl
    heads:
      - name: fraud
        num_labels: 2
        weight: 1.0
        dropout: 0.1
    text_column: text
    label_column: label
    label_maps: null

  # Task 2: 3-way sentiment classification.
  - name: sentiment_analysis
    type: single_label_classification
    data_path: fixtures/sample_sentiment.jsonl
    heads:
      - name: sentiment
        num_labels: 3
        weight: 1.0
        dropout: 0.1
    text_column: text
    label_column: label
    label_maps: null

  # Task 3: call-quality scoring with six heads; per-head loss weights
  # emphasize listening (1.5) and resolution (2.0), de-emphasize hold (0.5).
  - name: call_quality
    type: question_answering
    data_path: /content/JengaAI/fixtures/synthetic_qa_metrics_data_v01x.json
    heads:
      - name: opening
        num_labels: 1
        weight: 1.0
        dropout: 0.1
      - name: listening
        num_labels: 5
        weight: 1.5
        dropout: 0.1
      - name: proactiveness
        num_labels: 3
        weight: 1.0
        dropout: 0.1
      - name: resolution
        num_labels: 5
        weight: 2.0
        dropout: 0.1
      - name: hold
        num_labels: 2
        weight: 0.5
        dropout: 0.1
      - name: closing
        num_labels: 1
        weight: 1.0
        dropout: 0.1
    text_column: transcript
    label_column: labels
    # Integer label index -> human-readable label, per head.
    label_maps:
      opening:
        0: greeting
      listening:
        0: acknowledgment
        1: empathy
        2: clarification
        3: active_listening
        4: patience
      proactiveness:
        0: initiative
        1: follow_up
        2: suggestions
      resolution:
        0: identified_issue
        1: provided_solution
        2: confirmed_resolution
        3: set_expectations
        4: offered_alternatives
      hold:
        0: asked_permission
        1: explained_reason
      closing:
        0: proper_farewell

model:
  base_model: roberta-base
  hidden_size: 768
  dropout: 0.1
  fusion:
    type: attention
    dropout: 0.1
    use_residual: true
    num_attention_heads: 1
    gate_init_value: 0.5
  # NOTE(review): the flat source did not show nesting; these two are placed
  # under `model` (not `model.fusion`) — confirm against the config schema.
  freeze_encoder_layers: 0
  gradient_checkpointing: false

tokenizer:
  max_length: 256
  padding: max_length
  truncation: true

training:
  output_dir: ./results/roberta-base-3task_fusion
  learning_rate: 2.0e-05
  batch_size: 8
  eval_batch_size: 8
  num_epochs: 15
  weight_decay: 0.01
  warmup_steps: 20
  max_grad_norm: 1.0
  gradient_accumulation_steps: 1
  use_amp: false
  device: auto
  task_sampling: proportional
  temperature: 2.0
  early_stopping_patience: 5
  metric_for_best_model: eval_loss
  greater_is_better: false

logging:
  service: tensorboard
  experiment_name: security_3task_fusion
  tracking_uri: null
  log_every_n_steps: 5

checkpoint:
  save_every_n_epochs: 1
  save_best: true
  max_checkpoints: 2

data:
  test_size: 0.2
  seed: 42
  num_workers: 0
  pin_memory: true
  # NOTE(review): `pii_redaction` is placed under `data` based on its position
  # in the flat source; confirm it is not a top-level stanza in the schema.
  pii_redaction:
    enabled: false
    strategy: mask
    detect_types: null
    hash_salt: jenga-ai-pii
    log_detections: true