Revert to 7-label zone classification: F1 0.72 (the binary DISCARD/KEEP setup scored 0.28)
Browse files
train.py
CHANGED
|
@@ -23,10 +23,8 @@ from transformers import (
|
|
| 23 |
TrainingArguments,
|
| 24 |
)
|
| 25 |
|
| 26 |
-
#
|
| 27 |
-
|
| 28 |
-
# DISCARD = O, QUOTE_HEADER, QUOTE
|
| 29 |
-
ZONE_LABELS = ['DISCARD', 'KEEP']
|
| 30 |
LABEL2ID = {label: i for i, label in enumerate(ZONE_LABELS)}
|
| 31 |
ID2LABEL = {i: label for i, label in enumerate(ZONE_LABELS)}
|
| 32 |
|
|
|
|
| 23 |
TrainingArguments,
|
| 24 |
)
|
| 25 |
|
| 26 |
+
# Zone labels (7-class classification)
|
| 27 |
+
ZONE_LABELS = ['O', 'GREETING', 'AUTHOR', 'QUOTE_HEADER', 'QUOTE', 'SIGNATURE', 'FORWARD']
|
|
|
|
|
|
|
| 28 |
LABEL2ID = {label: i for i, label in enumerate(ZONE_LABELS)}
|
| 29 |
ID2LABEL = {i: label for i, label in enumerate(ZONE_LABELS)}
|
| 30 |
|