permutans committed on
Commit
348e0c6
·
verified ·
1 Parent(s): f6fe748

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. README.md +147 -157
  2. config.json +2 -5
  3. model.safetensors +1 -1
README.md CHANGED
@@ -31,7 +31,7 @@ This model performs span-level detection of 72 rhetorical marker types using BIO
31
  | Base model | `bert-base-uncased` |
32
  | Task | Token classification (BIO tagging) |
33
  | Labels | 145 (72 marker types × B/I + O) |
34
- | Best F1 | **0.459** (macro, markers only) |
35
  | Training | 15 epochs, batch 8, lr 2e-5 |
36
  | Loss | Focal loss (γ=1.0) for class imbalance |
37
 
@@ -119,165 +119,155 @@ Characteristics of written, analytical discourse:
119
 
120
  ## Evaluation
121
 
122
- Per-class F1 on test set (selected markers):
123
-
124
- | Marker | Precision | Recall | F1 | Support |
125
- |--------|-----------|--------|-----|---------|
126
- | oral_vocative | 0.889 | 0.593 | 0.711 | 27 |
127
- | oral_inclusive_we | 0.500 | 0.586 | 0.540 | 29 |
128
- | oral_second_person | 0.556 | 0.600 | 0.577 | 25 |
129
- | literate_conditional | 0.769 | 0.714 | 0.741 | 14 |
130
- | oral_self_correction | 1.000 | 1.000 | 1.000 | 3 |
131
- | oral_audience_response | 1.000 | 1.000 | 1.000 | 4 |
132
- | literate_citation | 0.000 | 0.000 | 0.000 | 10 |
133
 
134
  <details><summary>Click to show per-marker precision/recall/F1/support</summary>
135
 
136
  ```
137
- precision recall f1-score support
138
-
139
- O 0.730 0.850 0.785 3496
140
- B-literate_abstract_noun 0.500 0.071 0.125 14
141
- B-literate_additive_formal 1.000 0.667 0.800 3
142
- B-literate_agent_demoted 1.000 1.000 1.000 4
143
- B-literate_agentless_passive 0.297 0.458 0.361 24
144
- B-literate_aside 0.412 0.778 0.538 9
145
- B-literate_categorical_statement 0.571 1.000 0.727 4
146
- B-literate_causal_chain 0.667 0.667 0.667 3
147
- B-literate_causal_explicit 0.467 0.636 0.538 11
148
- B-literate_citation 0.000 0.000 0.000 10
149
- B-literate_conceptual_metaphor 0.500 0.333 0.400 6
150
- B-literate_concessive 1.000 1.000 1.000 2
151
- B-literate_concessive_connector 0.800 0.800 0.800 5
152
- B-literate_conditional 0.769 0.714 0.741 14
153
- B-literate_contrastive 0.455 0.625 0.526 8
154
- B-literate_definitional_move 1.000 1.000 1.000 1
155
- B-literate_enumeration 0.429 1.000 0.600 3
156
- B-literate_epistemic_hedge 0.357 0.417 0.385 24
157
- B-literate_evidential 0.000 0.000 0.000 11
158
- B-literate_footnote_reference 0.500 0.667 0.571 3
159
- B-literate_institutional_subject 0.429 1.000 0.600 3
160
- B-literate_list_structure 0.000 0.000 0.000 1
161
- B-literate_metadiscourse 0.500 0.250 0.333 4
162
- B-literate_methodological_framing 1.000 0.500 0.667 4
163
- B-literate_nested_clauses 0.345 0.455 0.392 22
164
- B-literate_nominalization 0.600 0.300 0.400 10
165
- B-literate_objectifying_stance 0.800 1.000 0.889 4
166
- B-literate_paradox 0.333 0.333 0.333 3
167
- B-literate_probability 0.333 0.200 0.250 5
168
- B-literate_qualified_assertion 0.000 0.000 0.000 5
169
- B-literate_relative_chain 0.270 0.773 0.400 22
170
- B-literate_technical_abbreviation 0.000 0.000 0.000 2
171
- B-literate_technical_term 0.333 0.667 0.444 3
172
- B-literate_temporal_embedding 1.000 0.500 0.667 4
173
- B-literate_third_person_reference 0.500 0.333 0.400 3
174
- B-oral_alliteration 0.000 0.000 0.000 3
175
- B-oral_anaphora 0.188 0.400 0.255 15
176
- B-oral_asyndeton 0.000 0.000 0.000 1
177
- B-oral_audience_response 1.000 1.000 1.000 4
178
- B-oral_binomial_expression 0.333 0.400 0.364 5
179
- B-oral_conflict_frame 0.800 0.800 0.800 5
180
- B-oral_discourse_formula 0.500 0.500 0.500 6
181
- B-oral_dramatic_pause 1.000 0.500 0.667 2
182
- B-oral_embodied_action 1.000 0.167 0.286 6
183
- B-oral_epistrophe 0.500 0.333 0.400 3
184
- B-oral_epithet 0.000 0.000 0.000 2
185
- B-oral_everyday_example 0.750 1.000 0.857 3
186
- B-oral_first_person 0.000 0.000 0.000 5
187
- B-oral_imperative 0.571 0.571 0.571 14
188
- B-oral_inclusive_we 0.500 0.586 0.540 29
189
- B-oral_intensifier_doubling 1.000 0.667 0.800 3
190
- B-oral_lexical_repetition 0.267 0.400 0.320 10
191
- B-oral_named_individual 0.474 0.450 0.462 20
192
- B-oral_parallelism 0.100 0.143 0.118 7
193
- B-oral_phatic_check 1.000 1.000 1.000 1
194
- B-oral_phatic_filler 0.429 0.600 0.500 5
195
- B-oral_polysyndeton 0.200 0.100 0.133 10
196
- B-oral_proverb 0.600 0.500 0.545 6
197
- B-oral_refrain 1.000 1.000 1.000 1
198
- B-oral_religious_formula 0.000 0.000 0.000 2
199
- B-oral_rhetorical_question 0.125 0.500 0.200 2
200
- B-oral_rhythm 0.714 0.833 0.769 6
201
- B-oral_second_person 0.556 0.600 0.577 25
202
- B-oral_self_correction 1.000 1.000 1.000 3
203
- B-oral_sensory_detail 0.500 1.000 0.667 1
204
- B-oral_simple_conjunction 0.000 0.000 0.000 3
205
- B-oral_specific_place 0.333 0.667 0.444 3
206
- B-oral_temporal_anchor 0.000 0.000 0.000 3
207
- B-oral_tricolon 0.286 1.000 0.444 2
208
- B-oral_us_them 0.667 0.667 0.667 3
209
- B-oral_vocative 0.889 0.593 0.711 27
210
- I-literate_abstract_noun 0.500 0.083 0.143 12
211
- I-literate_additive_formal 0.000 0.000 0.000 6
212
- I-literate_agent_demoted 0.583 0.933 0.718 15
213
- I-literate_agentless_passive 0.518 0.414 0.460 70
214
- I-literate_aside 0.700 0.618 0.656 102
215
- I-literate_categorical_statement 0.692 0.391 0.500 23
216
- I-literate_causal_chain 0.889 0.640 0.744 25
217
- I-literate_causal_explicit 0.593 0.762 0.667 21
218
- I-literate_citation 0.625 0.227 0.333 44
219
- I-literate_conceptual_metaphor 0.857 0.400 0.545 15
220
- I-literate_concessive 0.800 0.571 0.667 7
221
- I-literate_concessive_connector 0.667 0.667 0.667 3
222
- I-literate_conditional 0.784 0.351 0.485 114
223
- I-literate_contrastive 0.857 0.400 0.545 15
224
- I-literate_cross_reference 0.000 0.000 0.000 0
225
- I-literate_definitional_move 1.000 1.000 1.000 5
226
- I-literate_enumeration 0.680 0.436 0.531 39
227
- I-literate_epistemic_hedge 0.425 0.386 0.405 44
228
- I-literate_evidential 0.500 0.103 0.171 29
229
- I-literate_footnote_reference 1.000 0.727 0.842 11
230
- I-literate_institutional_subject 0.625 1.000 0.769 5
231
- I-literate_list_structure 0.000 0.000 0.000 3
232
- I-literate_metadiscourse 0.222 0.125 0.160 16
233
- I-literate_methodological_framing 0.857 0.500 0.632 12
234
- I-literate_nested_clauses 0.487 0.256 0.336 379
235
- I-literate_nominalization 0.000 0.000 0.000 11
236
- I-literate_objectifying_stance 0.900 0.692 0.783 13
237
- I-literate_paradox 0.250 0.062 0.100 16
238
- I-literate_probability 0.000 0.000 0.000 7
239
- I-literate_qualified_assertion 0.000 0.000 0.000 21
240
- I-literate_relative_chain 0.494 0.482 0.488 251
241
- I-literate_technical_abbreviation 0.750 0.273 0.400 11
242
- I-literate_technical_term 0.167 0.273 0.207 11
243
- I-literate_temporal_embedding 1.000 0.600 0.750 50
244
- I-literate_third_person_reference 0.714 0.833 0.769 6
245
- I-oral_alliteration 1.000 0.222 0.364 9
246
- I-oral_anaphora 0.140 0.070 0.093 100
247
- I-oral_asyndeton 0.417 0.714 0.526 7
248
- I-oral_audience_response 0.905 0.905 0.905 21
249
- I-oral_binomial_expression 0.529 0.818 0.643 11
250
- I-oral_conflict_frame 0.833 0.714 0.769 7
251
- I-oral_discourse_formula 0.625 0.833 0.714 6
252
- I-oral_dramatic_pause 0.500 0.500 0.500 4
253
- I-oral_embodied_action 1.000 0.062 0.118 16
254
- I-oral_epistrophe 0.000 0.000 0.000 3
255
- I-oral_epithet 0.200 0.200 0.200 5
256
- I-oral_everyday_example 1.000 0.950 0.974 20
257
- I-oral_first_person 0.000 0.000 0.000 2
258
- I-oral_imperative 0.692 0.333 0.450 27
259
- I-oral_inclusive_we 0.849 0.900 0.874 50
260
- I-oral_intensifier_doubling 0.800 1.000 0.889 4
261
- I-oral_lexical_repetition 0.241 0.341 0.283 41
262
- I-oral_named_individual 0.689 0.646 0.667 48
263
- I-oral_parallelism 0.518 0.319 0.394 135
264
- I-oral_phatic_check 1.000 1.000 1.000 3
265
- I-oral_phatic_filler 0.667 0.400 0.500 5
266
- I-oral_polysyndeton 1.000 0.268 0.423 82
267
- I-oral_proverb 0.955 0.568 0.712 37
268
- I-oral_refrain 1.000 1.000 1.000 4
269
- I-oral_religious_formula 0.000 0.000 0.000 16
270
- I-oral_rhetorical_question 0.312 0.333 0.323 15
271
- I-oral_rhythm 0.979 0.610 0.752 77
272
- I-oral_second_person 0.143 0.143 0.143 7
273
- I-oral_self_correction 0.857 0.900 0.878 20
274
- I-oral_sensory_detail 0.833 1.000 0.909 5
275
- I-oral_simple_conjunction 0.714 1.000 0.833 5
276
- I-oral_specific_place 0.714 0.625 0.667 8
277
- I-oral_temporal_anchor 0.059 0.100 0.074 10
278
- I-oral_tricolon 0.388 0.929 0.547 28
279
- I-oral_us_them 0.800 0.889 0.842 9
280
- I-oral_vocative 0.971 0.723 0.829 47
281
  ```
282
 
283
  </details>
@@ -383,7 +373,7 @@ Markers with <100 examples: 57 (79%)
383
 
384
  </details>
385
 
386
- **Macro F1 (all 145 labels):** 0.487
387
  **Weighted F1:** 0.645
388
  **Accuracy:** 66.5%
389
 
 
31
  | Base model | `bert-base-uncased` |
32
  | Task | Token classification (BIO tagging) |
33
  | Labels | 145 (72 marker types × B/I + O) |
34
+ | Best F1 | **0.4611** (macro, markers only) |
35
  | Training | 15 epochs, batch 8, lr 2e-5 |
36
  | Loss | Focal loss (γ=1.0) for class imbalance |
37
 
 
119
 
120
  ## Evaluation
121
 
122
+ Per-class F1 on test set:
 
 
 
 
 
 
 
 
 
 
123
 
124
  <details><summary>Click to show per-marker precision/recall/F1/support</summary>
125
 
126
  ```
127
+ precision recall f1-score support
128
+
129
+ O 0.721 0.835 0.774 3496
130
+ B-literate_abstract_noun 0.500 0.286 0.364 14
131
+ B-literate_additive_formal 0.667 0.667 0.667 3
132
+ B-literate_agent_demoted 0.800 1.000 0.889 4
133
+ B-literate_agentless_passive 0.312 0.417 0.357 24
134
+ B-literate_aside 0.438 0.778 0.560 9
135
+ B-literate_categorical_statement 0.333 0.500 0.400 4
136
+ B-literate_causal_chain 0.667 0.667 0.667 3
137
+ B-literate_causal_explicit 0.538 0.636 0.583 11
138
+ B-literate_citation 0.000 0.000 0.000 10
139
+ B-literate_conceptual_metaphor 0.500 0.167 0.250 6
140
+ B-literate_concessive 1.000 1.000 1.000 2
141
+ B-literate_concessive_connector 0.800 0.800 0.800 5
142
+ B-literate_conditional 0.667 0.714 0.690 14
143
+ B-literate_contrastive 0.333 0.375 0.353 8
144
+ B-literate_definitional_move 1.000 1.000 1.000 1
145
+ B-literate_enumeration 0.500 0.667 0.571 3
146
+ B-literate_epistemic_hedge 0.371 0.542 0.441 24
147
+ B-literate_evidential 0.000 0.000 0.000 11
148
+ B-literate_footnote_reference 0.500 0.667 0.571 3
149
+ B-literate_institutional_subject 0.600 1.000 0.750 3
150
+ B-literate_list_structure 0.000 0.000 0.000 1
151
+ B-literate_metadiscourse 0.500 0.500 0.500 4
152
+ B-literate_methodological_framing 1.000 0.500 0.667 4
153
+ B-literate_nested_clauses 0.300 0.545 0.387 22
154
+ B-literate_nominalization 0.750 0.300 0.429 10
155
+ B-literate_objectifying_stance 0.800 1.000 0.889 4
156
+ B-literate_paradox 0.500 0.333 0.400 3
157
+ B-literate_probability 0.333 0.200 0.250 5
158
+ B-literate_qualified_assertion 0.000 0.000 0.000 5
159
+ B-literate_relative_chain 0.327 0.773 0.459 22
160
+ B-literate_technical_abbreviation 0.000 0.000 0.000 2
161
+ B-literate_technical_term 0.400 0.667 0.500 3
162
+ B-literate_temporal_embedding 1.000 0.500 0.667 4
163
+ B-literate_third_person_reference 0.250 0.333 0.286 3
164
+ B-oral_alliteration 0.000 0.000 0.000 3
165
+ B-oral_anaphora 0.185 0.333 0.238 15
166
+ B-oral_asyndeton 0.000 0.000 0.000 1
167
+ B-oral_audience_response 1.000 1.000 1.000 4
168
+ B-oral_binomial_expression 0.333 0.400 0.364 5
169
+ B-oral_conflict_frame 0.800 0.800 0.800 5
170
+ B-oral_discourse_formula 0.333 0.500 0.400 6
171
+ B-oral_dramatic_pause 0.000 0.000 0.000 2
172
+ B-oral_embodied_action 1.000 0.167 0.286 6
173
+ B-oral_epistrophe 0.000 0.000 0.000 3
174
+ B-oral_epithet 0.333 0.500 0.400 2
175
+ B-oral_everyday_example 0.750 1.000 0.857 3
176
+ B-oral_first_person 0.000 0.000 0.000 5
177
+ B-oral_imperative 0.600 0.643 0.621 14
178
+ B-oral_inclusive_we 0.486 0.586 0.531 29
179
+ B-oral_intensifier_doubling 0.667 0.667 0.667 3
180
+ B-oral_lexical_repetition 0.273 0.300 0.286 10
181
+ B-oral_named_individual 0.450 0.450 0.450 20
182
+ B-oral_parallelism 0.000 0.000 0.000 7
183
+ B-oral_phatic_check 1.000 1.000 1.000 1
184
+ B-oral_phatic_filler 0.667 0.800 0.727 5
185
+ B-oral_polysyndeton 0.250 0.100 0.143 10
186
+ B-oral_proverb 1.000 0.333 0.500 6
187
+ B-oral_refrain 1.000 1.000 1.000 1
188
+ B-oral_religious_formula 0.000 0.000 0.000 2
189
+ B-oral_rhetorical_question 0.222 1.000 0.364 2
190
+ B-oral_rhythm 0.714 0.833 0.769 6
191
+ B-oral_second_person 0.533 0.640 0.582 25
192
+ B-oral_self_correction 0.600 1.000 0.750 3
193
+ B-oral_sensory_detail 1.000 1.000 1.000 1
194
+ B-oral_simple_conjunction 0.000 0.000 0.000 3
195
+ B-oral_specific_place 0.333 0.667 0.444 3
196
+ B-oral_temporal_anchor 0.000 0.000 0.000 3
197
+ B-oral_tricolon 0.200 1.000 0.333 2
198
+ B-oral_us_them 0.667 0.667 0.667 3
199
+ B-oral_vocative 0.714 0.556 0.625 27
200
+ I-literate_abstract_noun 0.000 0.000 0.000 12
201
+ I-literate_additive_formal 0.000 0.000 0.000 6
202
+ I-literate_agent_demoted 0.500 0.800 0.615 15
203
+ I-literate_agentless_passive 0.483 0.414 0.446 70
204
+ I-literate_aside 0.400 0.235 0.296 102
205
+ I-literate_categorical_statement 0.412 0.304 0.350 23
206
+ I-literate_causal_chain 0.917 0.440 0.595 25
207
+ I-literate_causal_explicit 0.444 0.762 0.561 21
208
+ I-literate_citation 0.444 0.182 0.258 44
209
+ I-literate_conceptual_metaphor 0.571 0.267 0.364 15
210
+ I-literate_concessive 0.750 0.429 0.545 7
211
+ I-literate_concessive_connector 0.400 0.667 0.500 3
212
+ I-literate_conditional 0.479 0.307 0.374 114
213
+ I-literate_contrastive 0.600 0.400 0.480 15
214
+ I-literate_cross_reference 0.000 0.000 0.000 0
215
+ I-literate_definitional_move 0.833 1.000 0.909 5
216
+ I-literate_enumeration 0.824 0.718 0.767 39
217
+ I-literate_epistemic_hedge 0.375 0.341 0.357 44
218
+ I-literate_evidential 0.333 0.034 0.062 29
219
+ I-literate_footnote_reference 0.667 0.727 0.696 11
220
+ I-literate_institutional_subject 1.000 1.000 1.000 5
221
+ I-literate_list_structure 0.000 0.000 0.000 3
222
+ I-literate_metadiscourse 0.200 0.125 0.154 16
223
+ I-literate_methodological_framing 0.750 0.500 0.600 12
224
+ I-literate_nested_clauses 0.336 0.127 0.184 379
225
+ I-literate_nominalization 0.000 0.000 0.000 11
226
+ I-literate_objectifying_stance 0.917 0.846 0.880 13
227
+ I-literate_paradox 0.100 0.062 0.077 16
228
+ I-literate_probability 0.000 0.000 0.000 7
229
+ I-literate_qualified_assertion 0.000 0.000 0.000 21
230
+ I-literate_relative_chain 0.402 0.422 0.412 251
231
+ I-literate_technical_abbreviation 0.833 0.455 0.588 11
232
+ I-literate_technical_term 0.250 0.273 0.261 11
233
+ I-literate_temporal_embedding 1.000 0.600 0.750 50
234
+ I-literate_third_person_reference 0.556 0.833 0.667 6
235
+ I-oral_alliteration 0.778 0.778 0.778 9
236
+ I-oral_anaphora 0.116 0.080 0.095 100
237
+ I-oral_asyndeton 0.000 0.000 0.000 7
238
+ I-oral_audience_response 0.864 0.905 0.884 21
239
+ I-oral_binomial_expression 0.533 0.727 0.615 11
240
+ I-oral_conflict_frame 1.000 0.714 0.833 7
241
+ I-oral_discourse_formula 0.545 1.000 0.706 6
242
+ I-oral_dramatic_pause 0.400 0.500 0.444 4
243
+ I-oral_embodied_action 0.000 0.000 0.000 16
244
+ I-oral_epistrophe 0.000 0.000 0.000 3
245
+ I-oral_epithet 0.400 0.400 0.400 5
246
+ I-oral_everyday_example 0.947 0.900 0.923 20
247
+ I-oral_first_person 0.000 0.000 0.000 2
248
+ I-oral_imperative 0.714 0.370 0.488 27
249
+ I-oral_inclusive_we 0.754 0.920 0.829 50
250
+ I-oral_intensifier_doubling 0.800 1.000 0.889 4
251
+ I-oral_lexical_repetition 0.250 0.317 0.280 41
252
+ I-oral_named_individual 0.620 0.646 0.633 48
253
+ I-oral_parallelism 0.485 0.237 0.318 135
254
+ I-oral_phatic_check 1.000 1.000 1.000 3
255
+ I-oral_phatic_filler 1.000 0.400 0.571 5
256
+ I-oral_polysyndeton 0.700 0.171 0.275 82
257
+ I-oral_proverb 0.938 0.405 0.566 37
258
+ I-oral_refrain 1.000 1.000 1.000 4
259
+ I-oral_religious_formula 1.000 0.062 0.118 16
260
+ I-oral_rhetorical_question 0.389 0.467 0.424 15
261
+ I-oral_rhythm 0.957 0.584 0.726 77
262
+ I-oral_second_person 0.250 0.143 0.182 7
263
+ I-oral_self_correction 0.889 0.800 0.842 20
264
+ I-oral_sensory_detail 0.833 1.000 0.909 5
265
+ I-oral_simple_conjunction 0.625 1.000 0.769 5
266
+ I-oral_specific_place 0.556 0.625 0.588 8
267
+ I-oral_temporal_anchor 0.056 0.100 0.071 10
268
+ I-oral_tricolon 0.329 0.964 0.491 28
269
+ I-oral_us_them 0.750 0.333 0.462 9
270
+ I-oral_vocative 0.846 0.702 0.767 47
271
  ```
272
 
273
  </details>
 
373
 
374
  </details>
375
 
376
+ **Macro F1 (all 145 labels):** 0.4611
377
  **Weighted F1:** 0.645
378
  **Accuracy:** 66.5%
379
 
config.json CHANGED
@@ -1,16 +1,13 @@
1
  {
2
  "add_cross_attention": false,
3
  "architectures": [
4
- "BertTokenClassifier"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": null,
8
  "classifier_dropout": null,
9
- "dropout": 0.1,
10
  "dtype": "float32",
11
  "eos_token_id": null,
12
- "focal_alpha": 1.0,
13
- "focal_gamma": 1.0,
14
  "gradient_checkpointing": false,
15
  "hidden_act": "gelu",
16
  "hidden_dropout_prob": 0.1,
@@ -314,7 +311,7 @@
314
  },
315
  "layer_norm_eps": 1e-12,
316
  "max_position_embeddings": 512,
317
- "model_type": "bert-token-classifier",
318
  "num_attention_heads": 12,
319
  "num_hidden_layers": 12,
320
  "pad_token_id": 0,
 
1
  {
2
  "add_cross_attention": false,
3
  "architectures": [
4
+ "BertForTokenClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": null,
8
  "classifier_dropout": null,
 
9
  "dtype": "float32",
10
  "eos_token_id": null,
 
 
11
  "gradient_checkpointing": false,
12
  "hidden_act": "gelu",
13
  "hidden_dropout_prob": 0.1,
 
311
  },
312
  "layer_norm_eps": 1e-12,
313
  "max_position_embeddings": 512,
314
+ "model_type": "bert",
315
  "num_attention_heads": 12,
316
  "num_hidden_layers": 12,
317
  "pad_token_id": 0,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d310f9767c901ae616ffd9d2fa59addc5e10a450b3b25d44c12bdedaeab3fbeb
3
  size 436035932
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:862313c38ca9273d9d4cbb21c001ce9fbf3798c8c3601eddfc009e63303341d7
3
  size 436035932