Rogendo's picture
Upload JengaAI model: Police_Case_Multi-Task_v2 — Mar 09 00:25
49d070d verified
project_name: police_case_reports_json
tasks:
- name: sentiment
type: sentiment
data_path: /home/naynek/Desktop/TujengeAI/Update/JengaAI/backend/uploads/datasets/16ced0930e7e_police_case_reports.json
heads:
- name: sentiment
num_labels: 4
weight: 1.0
dropout: 0.1
text_column: report_text
label_column: sentiment
label_maps:
sentiment:
0: negative
1: neutral
2: positive
3: urgent
- name: main_category
type: single_label_classification
data_path: /home/naynek/Desktop/TujengeAI/Update/JengaAI/backend/uploads/datasets/16ced0930e7e_police_case_reports.json
heads:
- name: main_category
num_labels: 10
weight: 1.0
dropout: 0.1
text_column: report_text
label_column: main_category
label_maps:
main_category:
0: Child Abuse
1: Commendation
2: Drug Abuse
3: Fraud
4: Human Trafficking
5: Missing Person
6: Theft
7: Traffic
8: Vandalism
9: Violence
- name: subcategory
type: single_label_classification
data_path: /home/naynek/Desktop/TujengeAI/Update/JengaAI/backend/uploads/datasets/16ced0930e7e_police_case_reports.json
heads:
- name: subcategory
num_labels: 24
weight: 1.0
dropout: 0.1
text_column: report_text
label_column: subcategory
label_maps:
subcategory:
0: ATM Fraud
1: Abandoned Child
2: Abandoned Vehicle
3: Bank Robbery
4: Breaking and Entering
5: Child Labour
6: Consumer Fraud
7: Domestic Servitude
8: Domestic Violence
9: Drug Distribution
10: Extortion
11: Gunfire
12: Hit and Run
13: Identity Theft
14: Illicit Brewing
15: Missing Child
16: Mugging
17: Officer Commendation
18: Phone Scam
19: Property Destruction
20: Robbery
21: Sexual Abuse
22: Tourist Scam
23: Vehicle Theft
- name: priority
type: single_label_classification
data_path: /home/naynek/Desktop/TujengeAI/Update/JengaAI/backend/uploads/datasets/16ced0930e7e_police_case_reports.json
heads:
- name: priority
num_labels: 4
weight: 1.0
dropout: 0.1
text_column: report_text
label_column: priority
label_maps:
priority:
0: critical
1: high
2: low
3: medium
- name: intervention
type: single_label_classification
data_path: /home/naynek/Desktop/TujengeAI/Update/JengaAI/backend/uploads/datasets/16ced0930e7e_police_case_reports.json
heads:
- name: intervention
num_labels: 8
weight: 1.0
dropout: 0.1
text_column: report_text
label_column: intervention
label_maps:
intervention:
0: Counseling
1: Investigation
2: Legal Aid
3: Medical
4: None Required
5: Police Dispatch
6: Search and Rescue
7: Welfare Services
- name: entity_extraction
type: ner
data_path: /home/naynek/Desktop/TujengeAI/Update/JengaAI/backend/uploads/datasets/16ced0930e7e_police_case_reports.json
heads:
- name: entity_extraction
num_labels: 15
weight: 1.0
dropout: 0.1
text_column: report_text
label_column: entities
label_maps:
ner_head:
0: O
1: B-DATE
2: I-DATE
3: B-LOCATION
4: I-LOCATION
5: B-NAME
6: I-NAME
7: B-ORG
8: I-ORG
9: B-TIME
10: I-TIME
11: B-VEHICLE
12: I-VEHICLE
13: B-WEAPON
14: I-WEAPON
model:
base_model: distilbert-base-uncased
hidden_size: 768
dropout: 0.1
fusion:
type: attention
dropout: 0.1
use_residual: true
num_attention_heads: 1
gate_init_value: 0.5
freeze_encoder_layers: 0
gradient_checkpointing: false
tokenizer:
max_length: 512
padding: max_length
truncation: true
training:
output_dir: ./results/police_case_reports_json
learning_rate: 2.0e-05
batch_size: 4
eval_batch_size: 4
num_epochs: 4
weight_decay: 0.01
warmup_steps: 50
max_grad_norm: 1.0
gradient_accumulation_steps: 1
use_amp: false
device: auto
task_sampling: round_robin
temperature: 2.0
early_stopping_patience: 3
metric_for_best_model: eval_loss
greater_is_better: false
logging:
service: mlflow
experiment_name: police_case_reports_json
tracking_uri: http://localhost:5000
log_every_n_steps: 10
checkpoint:
save_every_n_epochs: 1
save_best: true
max_checkpoints: 2
data:
test_size: 0.08
seed: 42
num_workers: 0
pin_memory: true
pii_redaction:
enabled: false
detect_types:
- email
- phone
- url
- card
- name
- org
log_detections: true