{ "release": "IrishCore-DiffMask-135M-v1-rc2", "repo_id": "temsa/IrishCore-DiffMask-135M-v1-rc2", "architecture": { "family": "DistilBERT-size token-span extractor", "diffusion_style_training": true, "runtime_diffusion": false, "scanner_free": true, "validator_free": true, "heads": [ "token_presence_head", "typed_start_boundary_head", "typed_end_boundary_head" ] }, "base_model": "OpenMed/OpenMed-PII-mLiteClinical-Base-135M-v1", "notes": [ "DiffMask uses a masked denoising training schedule, not a generative diffusion runtime.", "ONNX q8 is the recommended CPU deployment artifact.", "The release inference scripts emit [PII:LABEL] placeholders.", "This rc2 package was selected from an interpolation blend after cleaning label contamination in the v5 training mix.", "A UAT replay exact suite was added for the rc2 selection pass." ], "full": { "core_f1": 0.9664429530201343, "edge_f1": 1.0, "multilingual_f1": 0.9212121212121211, "hardening_f1": 0.9743589743589743 }, "onnx_q8": { "core_f1": 0.9664429530201343, "edge_f1": 1.0, "finance_f1": 1.0, "finance_boundary_f1": 1.0, "user_ppsn_f1": 1.0, "gaelic_weak_ppsn_f1": 1.0, "multilingual_f1": 0.9212121212121211, "hardening_f1": 0.9743589743589743, "uat_replay_exact_f1": 0.8275862068965517, "core_examples_per_second": 247.08088626660017, "multilingual_examples_per_second": 256.13155387081486, "runtime_profile_examples_per_second": 173.08521268339905, "uat_replay_examples_per_second": 183.66747754925285 }, "comparison": { "public_rc5_onnx_q8": { "core": 0.9668874172185431, "edge": 0.9743589743589743, "remaining_gaps": 0.888888888888889, "finance": 0.9361702127659575, "finance_boundary": 0.8750000000000001, "multilingual_ppsn": 0.9333333333333333, "user_ppsn": 1.0, "gaelic_weak_ppsn": 1.0, "overlap_ppsn": 1.0 }, "public_rc8_onnx_q8": { "min_score": 0.5, "core": 0.9736842105263158, "edge": 1.0, "finance": 1.0, "finance_boundary": 1.0, "user_ppsn": 1.0, "gaelic_weak_ppsn": 1.0, "multilingual_ppsn": 0.9176470588235294, "hardening": 0.7058823529411765, "core_examples_per_second": 257.37556287434955, "multilingual_examples_per_second": 230.51805414983642, "runtime_profile_examples_per_second": 179.47083751317666 } }, "uat_replay_exact_suite": { "dataset": "diffmask_gap_uat_exact_v1", "rc1_q8": { "f1": 0.45454545454545453, "precision": 1.0, "recall": 0.29411764705882354, "examples_per_second": 238.65238838006147 }, "rc8_q8": { "f1": 0.3636363636363636, "precision": 0.375, "recall": 0.35294117647058826, "examples_per_second": 110.75945444067594 }, "rc2_q8": { "f1": 0.8275862068965517, "precision": 1.0, "recall": 0.7058823529411765, "examples_per_second": 183.66747754925285 } }, "known_remaining_misses": [ "Second phone number inside the long Client Identity Services sentence: 071 967 2616", "Postcode inside the longer allocation-centre block: R93 EC57", "Email mailbox form: EPStamp4@enterprise.gov.ie", "One D02 XY45 address form from the UAT replay suite" ] }