oksomu
/

resume-ner

@@ -106,6 +106,10 @@
           "the comptia security+": "comptia security+"
         }
       },
       "EMAIL": {
         "min_length": 5,
         "exceptions": [],

           "the comptia security+": "comptia security+"
         }
       },
+      "DATE": {
+        "min_length": 3,
+        "exceptions": []
+      },
       "EMAIL": {
         "min_length": 5,
         "exceptions": [],

training/structured_postprocess.py CHANGED Viewed

@@ -106,7 +106,7 @@ class StructuredPostProcessor:
                 if pattern.lower() in cleaned.lower():
                     return None
         elif label == "SKILL":
-            cleaned = re.sub(r"[,.]$", "", cleaned)
         elif label == "COMPANY":
             if rules.get("strip_trailing_state_code"):
                 cleaned = re.sub(r",?\s+[A-Z]{2}$", "", cleaned).strip()

                 if pattern.lower() in cleaned.lower():
                     return None
         elif label == "SKILL":
+            cleaned = re.sub(r"[,.;:]+$", "", cleaned)
         elif label == "COMPANY":
             if rules.get("strip_trailing_state_code"):
                 cleaned = re.sub(r",?\s+[A-Z]{2}$", "", cleaned).strip()