fmnxl committed on
Commit
0774ad1
·
verified ·
1 Parent(s): a44e956

Revert to 7-label: F1 0.72 (binary was 0.28)

Browse files
Files changed (1) hide show
  1. train.py +2 -4
train.py CHANGED
@@ -23,10 +23,8 @@ from transformers import (
23
  TrainingArguments,
24
  )
25
 
26
- # Binary classification: KEEP (author content) vs DISCARD (quoted content)
27
- # KEEP = GREETING, AUTHOR, SIGNATURE, FORWARD
28
- # DISCARD = O, QUOTE_HEADER, QUOTE
29
- ZONE_LABELS = ['DISCARD', 'KEEP']
30
  LABEL2ID = {label: i for i, label in enumerate(ZONE_LABELS)}
31
  ID2LABEL = {i: label for i, label in enumerate(ZONE_LABELS)}
32
 
 
23
  TrainingArguments,
24
  )
25
 
26
+ # Zone labels (7-class classification)
27
+ ZONE_LABELS = ['O', 'GREETING', 'AUTHOR', 'QUOTE_HEADER', 'QUOTE', 'SIGNATURE', 'FORWARD']
 
 
28
  LABEL2ID = {label: i for i, label in enumerate(ZONE_LABELS)}
29
  ID2LABEL = {i: label for i, label in enumerate(ZONE_LABELS)}
30