{ "manifest_schema_version": 3, "config_path": "/nvme/CognitiveMemoryLayer/packages/models/model_pipeline.toml", "trained_at_utc": "2026-03-25T13:59:08.669850+00:00", "paths": { "prepared_dir": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack", "trained_models_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models" }, "train_settings": { "seed": 42, "families": [ "router", "extractor", "pair" ], "max_features": 250000, "min_df": 2, "ngram_min": 1, "ngram_max": 2, "max_iter": 25, "alpha": 1e-05, "predict_batch_size": 8192, "early_stopping": true, "early_stopping_patience": 3, "early_stopping_metric": "macro_f1", "early_stopping_min_delta": 0.001, "calibration_method": "sigmoid", "calibration_split": "eval", "transformer": { "model_name_or_path": "microsoft/deberta-v3-base", "tokenizer_name": "", "num_train_epochs": 2, "per_device_train_batch_size": 8, "per_device_eval_batch_size": 16, "max_seq_length": 256, "learning_rate": 2e-05, "warmup_ratio": 0.1, "weight_decay": 0.01, "gradient_accumulation_steps": 1, "score_margin": 0.15, "focal_gamma": 1.5, "temperature_grid": [ 0.7, 0.85, 1.0, 1.15, 1.3, 1.5, 2.0 ] }, "token": { "model_name_or_path": "bert-base-multilingual-cased", "num_train_epochs": 8, "per_device_train_batch_size": 8, "per_device_eval_batch_size": 16, "max_seq_length": 256, "stride": 64, "learning_rate": 5e-05, "warmup_ratio": 0.1, "weight_decay": 0.01, "gradient_accumulation_steps": 1 }, "allow_dirty": false, "release_mode": false, "strict": true }, "build_metadata": { "python_version": "3.14.3 (main, Mar 11 2026, 19:17:30) [GCC 15.2.0]", "dependencies": { "scikit_learn": "1.8.0", "joblib": "1.5.3", "pandas": "3.0.1" }, "commit_sha": "090060c4478c373a02eb09ae63292f51ca31a710", "dirty": true }, "configured_tasks": [ { "task_name": "retrieval_constraint_relevance_pair", "family": "pair", "input_type": "pair", "objective": "pair_ranking", "enabled": true, "artifact_name": "retrieval_constraint_relevance_pair", "metrics": [ "mrr@10", "ndcg@10", "recall@10" ], "trainer": "transformer_pair", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "BAAI/bge-reranker-base", "tokenizer_name": "" }, { "task_name": "memory_rerank_pair", "family": "pair", "input_type": "pair", "objective": "pair_ranking", "enabled": true, "artifact_name": "memory_rerank_pair", "metrics": [ "mrr@10", "ndcg@10", "recall@10" ], "trainer": "transformer_pair", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "BAAI/bge-reranker-base", "tokenizer_name": "" }, { "task_name": "novelty_pair", "family": "pair", "input_type": "pair", "objective": "classification", "enabled": true, "artifact_name": "novelty_pair", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "transformer_pair", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "BAAI/bge-reranker-base", "tokenizer_name": "" }, { "task_name": "fact_extraction_structured", "family": "extractor", "input_type": "single", "objective": "token_classification", "enabled": true, "artifact_name": "fact_extraction_structured", "metrics": [ "span_f1", "span_exact_match" ], "trainer": "", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "schema_match_pair", "family": "pair", "input_type": "pair", "objective": "classification", "enabled": true, "artifact_name": "schema_match_pair", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "transformer_pair", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "BAAI/bge-reranker-base", "tokenizer_name": "" }, { "task_name": "reconsolidation_candidate_pair", "family": "pair", "input_type": "pair", "objective": "pair_ranking", "enabled": true, "artifact_name": "reconsolidation_candidate_pair", "metrics": [ "mrr@10", "ndcg@10", "recall@10" ], "trainer": "transformer_pair", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "BAAI/bge-reranker-base", "tokenizer_name": "" }, { "task_name": "write_importance_regression", "family": "router", "input_type": "single", "objective": "single_regression", "enabled": true, "artifact_name": "write_importance_regression", "metrics": [ "mae", "rmse" ], "trainer": "", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "memory_type", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "memory_type", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "hierarchical_transformer", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "" }, { "task_name": "salience_bin", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "salience_bin", "metrics": [ "accuracy", "macro_f1", "weighted_f1", "ordinal_mae", "off_by_two_rate" ], "trainer": "ordinal_threshold", "feature_backend": "", "label_order": [ "low", "medium", "high" ], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "importance_bin", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "importance_bin", "metrics": [ "accuracy", "macro_f1", "weighted_f1", "ordinal_mae", "off_by_two_rate" ], "trainer": "ordinal_threshold", "feature_backend": "", "label_order": [ "low", "medium", "high" ], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "confidence_bin", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "confidence_bin", "metrics": [ "accuracy", "macro_f1", "weighted_f1", "ordinal_mae", "off_by_two_rate" ], "trainer": "ordinal_threshold", "feature_backend": "", "label_order": [ "low", "medium", "high" ], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "decay_profile", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "decay_profile", "metrics": [ "accuracy", "macro_f1", "weighted_f1", "ordinal_mae", "off_by_two_rate" ], "trainer": "ordinal_threshold", "feature_backend": "", "label_order": [ "very_fast", "fast", "medium", "slow", "very_slow" ], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "pii_span_detection", "family": "extractor", "input_type": "single", "objective": "token_classification", "enabled": true, "artifact_name": "pii_span_detection", "metrics": [ "span_f1", "span_exact_match" ], "trainer": "", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "", "tokenizer_name": "" }, { "task_name": "consolidation_gist_quality", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "consolidation_gist_quality", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "transformer_text", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "" }, { "task_name": "forgetting_action_policy", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "forgetting_action_policy", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "transformer_text", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "" }, { "task_name": "constraint_dimension", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "constraint_dimension", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "transformer_text", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "" }, { "task_name": "context_tag", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "artifact_name": "context_tag", "metrics": [ "accuracy", "macro_f1", "weighted_f1" ], "trainer": "transformer_text", "feature_backend": "", "label_order": [], "embedding_model_name": "", "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "" } ], "preflight_validation": { "ok": true, "strict": true, "errors": [], "warnings": [], "task_checks": [ { "task_name": "retrieval_constraint_relevance_pair", "family": "pair", "input_type": "pair", "objective": "pair_ranking", "enabled": true, "status": "ok", "reason": null, "rows_found": 80000, "valid_score_rows": 0 }, { "task_name": "memory_rerank_pair", "family": "pair", "input_type": "pair", "objective": "pair_ranking", "enabled": true, "status": "ok", "reason": null, "rows_found": 80000, "valid_score_rows": 0 }, { "task_name": "novelty_pair", "family": "pair", "input_type": "pair", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 117206, "valid_score_rows": 0 }, { "task_name": "fact_extraction_structured", "family": "extractor", "input_type": "single", "objective": "token_classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 31997, "valid_score_rows": 0 }, { "task_name": "schema_match_pair", "family": "pair", "input_type": "pair", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 81200, "valid_score_rows": 0 }, { "task_name": "reconsolidation_candidate_pair", "family": "pair", "input_type": "pair", "objective": "pair_ranking", "enabled": true, "status": "ok", "reason": null, "rows_found": 80000, "valid_score_rows": 0 }, { "task_name": "write_importance_regression", "family": "router", "input_type": "single", "objective": "single_regression", "enabled": true, "status": "ok", "reason": null, "rows_found": 8000, "valid_score_rows": 8000 }, { "task_name": "memory_type", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 120000, "valid_score_rows": 0 }, { "task_name": "salience_bin", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 24000, "valid_score_rows": 0 }, { "task_name": "importance_bin", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 24000, "valid_score_rows": 0 }, { "task_name": "confidence_bin", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 24000, "valid_score_rows": 0 }, { "task_name": "decay_profile", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 40000, "valid_score_rows": 0 }, { "task_name": "pii_span_detection", "family": "extractor", "input_type": "single", "objective": "token_classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 30516, "valid_score_rows": 0 }, { "task_name": "consolidation_gist_quality", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 10432, "valid_score_rows": 0 }, { "task_name": "forgetting_action_policy", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 40000, "valid_score_rows": 0 }, { "task_name": "constraint_dimension", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 48000, "valid_score_rows": 0 }, { "task_name": "context_tag", "family": "router", "input_type": "single", "objective": "classification", "enabled": true, "status": "ok", "reason": null, "rows_found": 64000, "valid_score_rows": 0 } ], "observed_tasks_by_family": { "extractor": [ "constraint_scope", "constraint_stability", "constraint_type", "fact_type", "pii_presence" ], "pair": [ "conflict_detection", "constraint_rerank", "memory_rerank_pair", "novelty_pair", "reconsolidation_candidate_pair", "retrieval_constraint_relevance_pair", "schema_match_pair", "scope_match", "supersession" ], "router": [ "confidence_bin", "consolidation_gist_quality", "constraint_dimension", "context_tag", "decay_profile", "forgetting_action_policy", "importance_bin", "memory_type", "query_domain", "query_intent", "salience_bin", "write_importance_regression" ] }, "coverage_vs_config": { "extractor": { "configured_enabled_tasks": [], "observed_tasks": [ "constraint_scope", "constraint_stability", "constraint_type", "fact_type", "pii_presence" ], "missing_configured_tasks": [] }, "pair": { "configured_enabled_tasks": [ "memory_rerank_pair", "novelty_pair", "reconsolidation_candidate_pair", "retrieval_constraint_relevance_pair", "schema_match_pair" ], "observed_tasks": [ "conflict_detection", "constraint_rerank", "memory_rerank_pair", "novelty_pair", "reconsolidation_candidate_pair", "retrieval_constraint_relevance_pair", "schema_match_pair", "scope_match", "supersession" ], "missing_configured_tasks": [] }, "router": { "configured_enabled_tasks": [ "confidence_bin", "consolidation_gist_quality", "constraint_dimension", "context_tag", "decay_profile", "forgetting_action_policy", "importance_bin", "memory_type", "salience_bin", "write_importance_regression" ], "observed_tasks": [ "confidence_bin", "consolidation_gist_quality", "constraint_dimension", "context_tag", "decay_profile", "forgetting_action_policy", "importance_bin", "memory_type", "query_domain", "query_intent", "salience_bin", "write_importance_regression" ], "missing_configured_tasks": [] } } }, "families": { "router": { "model_path": "packages/models/trained_models/router_model.joblib" }, "extractor": { "model_path": "packages/models/trained_models/extractor_model.joblib" }, "pair": { "model_path": "packages/models/trained_models/pair_model.joblib" } }, "task_training_status": { "retrieval_constraint_relevance_pair": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "pair", "objective": "pair_ranking", "enabled": true }, "memory_rerank_pair": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "pair", "objective": "pair_ranking", "enabled": true }, "novelty_pair": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "pair", "objective": "classification", "enabled": true }, "fact_extraction_structured": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "extractor", "objective": "token_classification", "enabled": true }, "schema_match_pair": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "pair", "objective": "classification", "enabled": true }, "reconsolidation_candidate_pair": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "pair", "objective": "pair_ranking", "enabled": true }, "write_importance_regression": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "single_regression", "enabled": true }, "memory_type": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "salience_bin": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "importance_bin": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "confidence_bin": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "decay_profile": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "pii_span_detection": { "status": "trained", "reason": null, "family": "extractor", "objective": "token_classification", "enabled": true, "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/pii_span_detection_model.joblib", "train_rows": 30516 }, "consolidation_gist_quality": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "forgetting_action_policy": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "constraint_dimension": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true }, "context_tag": { "status": "filtered_out", "reason": "Excluded by --tasks filter", "family": "router", "objective": "classification", "enabled": true } }, "task_models": { "memory_rerank_pair": { "model_path": "packages/models/trained_models/memory_rerank_pair_model.joblib", "hf_model_dir": "packages/models/trained_models/memory_rerank_pair_hf" }, "retrieval_constraint_relevance_pair": { "model_path": "packages/models/trained_models/retrieval_constraint_relevance_pair_model.joblib", "hf_model_dir": "packages/models/trained_models/retrieval_constraint_relevance_pair_hf" }, "novelty_pair": { "model_path": "packages/models/trained_models/novelty_pair_model.joblib", "hf_model_dir": "packages/models/trained_models/novelty_pair_hf" }, "fact_extraction_structured": { "model_path": "packages/models/trained_models/fact_extraction_structured_model.joblib", "hf_model_dir": "packages/models/trained_models/fact_extraction_structured_hf" }, "schema_match_pair": { "task": "schema_match_pair", "objective": "classification", "trainer": "transformer_pair", "model_kind": "transformer_pair", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/schema_match_pair_model.joblib", "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/schema_match_pair_hf", "train_rows": 81200, "test": { "rows": 10000, "accuracy": 0.8552, "macro_f1": 0.8551561470750885, "weighted_f1": 0.8551561470750885, "micro_f1": 0.8552, "labels": [ "schema_match_pair::match", "schema_match_pair::no_match" ], "confusion_matrix": [ [ 4189, 811 ], [ 637, 4363 ] ], "calibration_error": 0.03336120770113563, "classification_report": { "schema_match_pair::match": { "precision": 0.8680066307501036, "recall": 0.8378, "f1-score": 0.852635864034195, "support": 5000.0 }, "schema_match_pair::no_match": { "precision": 0.8432547352145342, "recall": 0.8726, "f1-score": 0.8576764301159819, "support": 5000.0 }, "accuracy": 0.8552, "macro avg": { "precision": 0.8556306829823189, "recall": 0.8552, "f1-score": 0.8551561470750885, "support": 10000.0 }, "weighted avg": { "precision": 0.8556306829823188, "recall": 0.8552, "f1-score": 0.8551561470750885, "support": 10000.0 } } }, "eval": { "rows": 10000, "accuracy": 0.8517, "macro_f1": 0.8516351927685533, "weighted_f1": 0.8516351927685533, "micro_f1": 0.8517, "labels": [ "schema_match_pair::match", "schema_match_pair::no_match" ], "confusion_matrix": [ [ 4154, 846 ], [ 637, 4363 ] ], "calibration_error": 0.03950018305884612, "classification_report": { "schema_match_pair::match": { "precision": 0.8670423711125026, "recall": 0.8308, "f1-score": 0.848534368297416, "support": 5000.0 }, "schema_match_pair::no_match": { "precision": 0.8375887886350547, "recall": 0.8726, "f1-score": 0.8547360172396905, "support": 5000.0 }, "accuracy": 0.8517, "macro avg": { "precision": 0.8523155798737787, "recall": 0.8517, "f1-score": 0.8516351927685533, "support": 10000.0 }, "weighted avg": { "precision": 0.8523155798737786, "recall": 0.8517, "f1-score": 0.8516351927685533, "support": 10000.0 } } }, "actual_epochs": 4, "best_epoch": 4, "early_stopped": false, "selection_metric": "macro_f1", "selection_value": 0.8516351927685533, "backbone_model_name": "BAAI/bge-reranker-base", "tokenizer_name": "BAAI/bge-reranker-base", "calibration": { "method": "temperature_grid_search", "rows": 10000, "temperature": 1.3, "loss": 0.3754132442613608 }, "thresholds": { "default_threshold": 0.26, "positive_label": "schema_match_pair::match", "precision_floor": 0.85, "positive_f1": 0.8544423440453687, "positive_precision": 0.8501286873886359 }, "artifact_scope": "task", "evaluation_suite": "standard", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pair_train.parquet", "sha256": "5b19ae2af42d3bbeb58fa8cda2a6b40748e2561a7c4c60a464e2eced711d7c16", "bytes": 99474783 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pair_test.parquet", "sha256": "33f2d21d29ab684df5c9ab8df2b8bea8ffaa485434bc14bed350cea86a075a88", "bytes": 14270999 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pair_eval.parquet", "sha256": "cb6fae7ab447adb0d49af2de458dfbfa82f1af1efa5fd72644e2e6a9db7d07b7", "bytes": 14298411 } }, "release_gates": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.8, "actual": 0.8551561470750885, "passed": true }, { "section": "test", "metric": "calibration_error", "threshold": { "max": 0.08 }, "actual": 0.03336120770113563, "passed": true } ] } }, "reconsolidation_candidate_pair": { "model_path": "packages/models/trained_models/reconsolidation_candidate_pair_model.joblib", "hf_model_dir": "packages/models/trained_models/reconsolidation_candidate_pair_hf" }, "write_importance_regression": { "model_path": "packages/models/trained_models/write_importance_regression_model.joblib" }, "forgetting_action_policy": { "task": "forgetting_action_policy", "objective": "classification", "trainer": "transformer_text", "model_kind": "transformer_text", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/forgetting_action_policy_model.joblib", "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/forgetting_action_policy_hf", "train_rows": 28580, "test": { "rows": 18920, "accuracy": 0.9994714587737844, "macro_f1": 0.9994714168187103, "weighted_f1": 0.9994714168187103, "micro_f1": 0.9994714587737844, "labels": [ "forgetting_action_policy::compress", "forgetting_action_policy::decay", "forgetting_action_policy::delete", "forgetting_action_policy::keep", "forgetting_action_policy::silence" ], "confusion_matrix": [ [ 3782, 2, 0, 0, 0 ], [ 0, 3784, 0, 0, 0 ], [ 0, 0, 3779, 1, 4 ], [ 0, 0, 0, 3784, 0 ], [ 2, 0, 1, 0, 3781 ] ], "calibration_error": 0.01649172677837832, "classification_report": { "forgetting_action_policy::compress": { "precision": 0.9994714587737844, "recall": 0.9994714587737844, "f1-score": 0.9994714587737844, "support": 3784.0 }, "forgetting_action_policy::decay": { "precision": 0.9994717379820391, "recall": 1.0, "f1-score": 0.9997357992073976, "support": 3784.0 }, "forgetting_action_policy::delete": { "precision": 0.9997354497354497, "recall": 0.9986786469344608, "f1-score": 0.9992067689053411, "support": 3784.0 }, "forgetting_action_policy::keep": { "precision": 0.9997357992073976, "recall": 1.0, "f1-score": 0.9998678821508786, "support": 3784.0 }, "forgetting_action_policy::silence": { "precision": 0.9989431968295905, "recall": 0.9992071881606766, "f1-score": 0.9990751750561501, "support": 3784.0 }, "accuracy": 0.9994714587737844, "macro avg": { "precision": 0.9994715285056524, "recall": 0.9994714587737844, "f1-score": 0.9994714168187103, "support": 18920.0 }, "weighted avg": { "precision": 0.9994715285056522, "recall": 0.9994714587737844, "f1-score": 0.9994714168187103, "support": 18920.0 } } }, "eval": { "rows": 5000, "accuracy": 0.984, "macro_f1": 0.9839922007228425, "weighted_f1": 0.9839922007228427, "micro_f1": 0.984, "labels": [ "forgetting_action_policy::compress", "forgetting_action_policy::decay", "forgetting_action_policy::delete", "forgetting_action_policy::keep", "forgetting_action_policy::silence" ], "confusion_matrix": [ [ 988, 3, 0, 9, 0 ], [ 3, 986, 1, 1, 9 ], [ 2, 0, 994, 0, 4 ], [ 6, 11, 0, 979, 4 ], [ 2, 11, 11, 3, 973 ] ], "calibration_error": 0.0073812406567217975, "classification_report": { "forgetting_action_policy::compress": { "precision": 0.987012987012987, "recall": 0.988, "f1-score": 0.9875062468765617, "support": 1000.0 }, "forgetting_action_policy::decay": { "precision": 0.9752720079129574, "recall": 0.986, "f1-score": 0.9806066633515664, "support": 1000.0 }, "forgetting_action_policy::delete": { "precision": 0.9880715705765407, "recall": 0.994, "f1-score": 0.9910269192422732, "support": 1000.0 }, "forgetting_action_policy::keep": { "precision": 0.9868951612903226, "recall": 0.979, "f1-score": 0.9829317269076305, "support": 1000.0 }, "forgetting_action_policy::silence": { "precision": 0.9828282828282828, "recall": 0.973, "f1-score": 0.9778894472361809, "support": 1000.0 }, "accuracy": 0.984, "macro avg": { "precision": 0.984016001924218, "recall": 0.984, "f1-score": 0.9839922007228425, "support": 5000.0 }, "weighted avg": { "precision": 0.9840160019242181, "recall": 0.984, "f1-score": 0.9839922007228427, "support": 5000.0 } } }, "actual_epochs": 8, "best_epoch": 7, "early_stopped": false, "selection_metric": "macro_f1", "selection_value": 0.9839922007228425, "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "microsoft/deberta-v3-base", "calibration": { "method": "temperature_grid_search", "rows": 5000, "temperature": 2.0, "loss": 0.08134587520392533 }, "artifact_scope": "task", "evaluation_suite": "standard", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet", "sha256": "d6cf7bf6638ca6d2a0b12d3e011aac120866f3cbf7364359bcc32a1f86ac3770", "bytes": 44674192 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet", "sha256": "2665b088823ca9733c9f53a62aa9e4c8f6148a8d169ebfb69641d04a3e710552", "bytes": 7175410 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet", "sha256": "b492f3fd739408de18bfd17b5c57248b51b90dba10e744f2687b50cdc351e13f", "bytes": 6746274 } }, "release_gates": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.93, "actual": 0.9994714168187103, "passed": true }, { "section": "test", "metric": "decay_recall", "threshold": 0.9, "actual": 1.0, "passed": true }, { "section": "test", "metric": "delete_recall", "threshold": 0.9, "actual": 0.9986786469344608, "passed": true } ] } }, "constraint_dimension": { "task": "constraint_dimension", "objective": "classification", "trainer": "transformer_text", "model_kind": "transformer_text", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/constraint_dimension_model.joblib", "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/constraint_dimension_hf", "train_rows": 48000, "test": { "rows": 6000, "accuracy": 0.8828333333333334, "macro_f1": 0.883185453547077, "weighted_f1": 0.883185453547077, "micro_f1": 0.8828333333333334, "labels": [ "constraint_dimension::causal", "constraint_dimension::goal", "constraint_dimension::other", "constraint_dimension::policy", "constraint_dimension::state", "constraint_dimension::value" ], "confusion_matrix": [ [ 966, 2, 20, 1, 7, 4 ], [ 1, 927, 47, 2, 6, 17 ], [ 12, 30, 817, 22, 56, 63 ], [ 0, 2, 26, 949, 1, 22 ], [ 27, 7, 63, 8, 865, 30 ], [ 7, 19, 137, 27, 37, 773 ] ], "calibration_error": 0.08291319935909541, "classification_report": { "constraint_dimension::causal": { "precision": 0.9536031589338598, "recall": 0.966, "f1-score": 0.9597615499254843, "support": 1000.0 }, "constraint_dimension::goal": { "precision": 0.939209726443769, "recall": 0.927, "f1-score": 0.9330649219929542, "support": 1000.0 }, "constraint_dimension::other": { "precision": 0.7360360360360361, "recall": 0.817, "f1-score": 0.7744075829383886, "support": 1000.0 }, "constraint_dimension::policy": { "precision": 0.9405351833498513, "recall": 0.949, "f1-score": 0.944748631159781, "support": 1000.0 }, "constraint_dimension::state": { "precision": 0.8899176954732511, "recall": 0.865, "f1-score": 0.8772819472616633, "support": 1000.0 }, "constraint_dimension::value": { "precision": 0.8503850385038504, "recall": 0.773, "f1-score": 0.8098480880041907, "support": 1000.0 }, "accuracy": 0.8828333333333334, "macro avg": { "precision": 0.8849478064567696, "recall": 0.8828333333333332, "f1-score": 0.883185453547077, "support": 6000.0 }, "weighted avg": { "precision": 0.8849478064567696, "recall": 0.8828333333333334, "f1-score": 0.883185453547077, "support": 6000.0 } } }, "eval": { "rows": 6000, "accuracy": 0.8698333333333333, "macro_f1": 0.8703105353987516, "weighted_f1": 0.8703105353987517, "micro_f1": 0.8698333333333333, "labels": [ "constraint_dimension::causal", "constraint_dimension::goal", "constraint_dimension::other", "constraint_dimension::policy", "constraint_dimension::state", "constraint_dimension::value" ], "confusion_matrix": [ [ 965, 2, 16, 0, 12, 5 ], [ 1, 907, 57, 1, 9, 25 ], [ 19, 31, 791, 18, 56, 85 ], [ 1, 0, 22, 954, 2, 21 ], [ 27, 13, 78, 6, 842, 34 ], [ 13, 23, 145, 23, 36, 760 ] ], "calibration_error": 0.09575599064379686, "classification_report": { "constraint_dimension::causal": { "precision": 0.9405458089668616, "recall": 0.965, "f1-score": 0.9526159921026653, "support": 1000.0 }, "constraint_dimension::goal": { "precision": 0.9293032786885246, "recall": 0.907, "f1-score": 0.9180161943319838, "support": 1000.0 }, "constraint_dimension::other": { "precision": 0.7132551848512173, "recall": 0.791, "f1-score": 0.7501185395922239, "support": 1000.0 }, "constraint_dimension::policy": { "precision": 0.9520958083832335, "recall": 0.954, "f1-score": 0.9530469530469531, "support": 1000.0 }, "constraint_dimension::state": { "precision": 0.8798328108672936, "recall": 0.842, "f1-score": 0.8605007664793051, "support": 1000.0 }, "constraint_dimension::value": { "precision": 0.8172043010752689, "recall": 0.76, "f1-score": 0.7875647668393783, "support": 1000.0 }, "accuracy": 0.8698333333333333, "macro avg": { "precision": 0.8720395321387332, "recall": 0.8698333333333332, "f1-score": 0.8703105353987516, "support": 6000.0 }, "weighted avg": { "precision": 0.8720395321387332, "recall": 0.8698333333333333, "f1-score": 0.8703105353987517, "support": 6000.0 } } }, "actual_epochs": 10, "best_epoch": 10, "early_stopped": false, "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "microsoft/deberta-v3-base", "calibration": { "method": "temperature_grid_search", "rows": 6000, "temperature": 2.0, "loss": 0.5294126563569427 }, "artifact_scope": "task", "evaluation_suite": "standard", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet", "sha256": "d6cf7bf6638ca6d2a0b12d3e011aac120866f3cbf7364359bcc32a1f86ac3770", "bytes": 44674192 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet", "sha256": "c24ff4a481709443ccdac0bad5916fede972611b3cdd683a578f750d18a40e71", "bytes": 7175410 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet", "sha256": "b492f3fd739408de18bfd17b5c57248b51b90dba10e744f2687b50cdc351e13f", "bytes": 6746274 } }, "release_gates": { "passed": true, "checks": [] } }, "context_tag": { "task": "context_tag", "objective": "classification", "trainer": "transformer_text", "model_kind": "transformer_text", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/context_tag_model.joblib", "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/context_tag_hf", "train_rows": 64000, "test": { "rows": 8000, "accuracy": 0.947375, "macro_f1": 0.9462078544778264, "weighted_f1": 0.9462078544778263, "micro_f1": 0.947375, "labels": [ "context_tag::finance", "context_tag::food", "context_tag::general", "context_tag::health", "context_tag::social", "context_tag::tech", "context_tag::travel", "context_tag::work" ], "confusion_matrix": [ [ 979, 0, 12, 1, 0, 3, 1, 4 ], [ 0, 951, 15, 24, 8, 0, 2, 0 ], [ 52, 34, 775, 27, 28, 21, 30, 33 ], [ 0, 13, 15, 972, 0, 0, 0, 0 ], [ 1, 5, 10, 0, 975, 0, 6, 3 ], [ 2, 0, 9, 0, 0, 975, 0, 14 ], [ 4, 0, 4, 0, 4, 1, 986, 1 ], [ 5, 0, 11, 0, 0, 17, 1, 966 ] ], "calibration_error": 0.024662236875587645, "classification_report": { "context_tag::finance": { "precision": 0.9386385426653883, "recall": 0.979, "f1-score": 0.9583945178658835, "support": 1000.0 }, "context_tag::food": { "precision": 0.9481555333998006, "recall": 0.951, "f1-score": 0.9495756365451822, "support": 1000.0 }, "context_tag::general": { "precision": 0.9106933019976499, "recall": 0.775, "f1-score": 0.8373851971907077, "support": 1000.0 }, "context_tag::health": { "precision": 0.94921875, "recall": 0.972, "f1-score": 0.9604743083003953, "support": 1000.0 }, "context_tag::social": { "precision": 0.9605911330049262, "recall": 0.975, "f1-score": 0.967741935483871, "support": 1000.0 }, "context_tag::tech": { "precision": 0.9587020648967551, "recall": 0.975, "f1-score": 0.9667823500247893, "support": 1000.0 }, "context_tag::travel": { "precision": 0.9610136452241715, "recall": 0.986, "f1-score": 0.9733464955577492, "support": 1000.0 }, "context_tag::work": { "precision": 0.9461312438785504, "recall": 0.966, "f1-score": 0.9559623948540327, "support": 1000.0 }, "accuracy": 0.947375, "macro avg": { "precision": 0.9466430268834052, "recall": 0.947375, "f1-score": 0.9462078544778264, "support": 8000.0 }, "weighted avg": { "precision": 0.9466430268834054, "recall": 0.947375, "f1-score": 0.9462078544778263, "support": 8000.0 } } }, "eval": { "rows": 8000, "accuracy": 0.94625, "macro_f1": 0.9445890976694143, "weighted_f1": 0.9445890976694143, "micro_f1": 0.94625, "labels": [ "context_tag::finance", "context_tag::food", "context_tag::general", "context_tag::health", "context_tag::social", "context_tag::tech", "context_tag::travel", "context_tag::work" ], "confusion_matrix": [ [ 982, 0, 8, 0, 0, 4, 0, 6 ], [ 1, 972, 9, 11, 6, 0, 1, 0 ], [ 50, 53, 743, 33, 29, 26, 27, 39 ], [ 1, 18, 10, 967, 1, 2, 0, 1 ], [ 2, 5, 4, 1, 984, 0, 2, 2 ], [ 5, 0, 14, 2, 1, 971, 0, 7 ], [ 1, 2, 6, 0, 6, 1, 983, 1 ], [ 1, 0, 11, 0, 0, 19, 1, 968 ] ], "calibration_error": 0.023930798305538282, "classification_report": { "context_tag::finance": { "precision": 0.9415148609779482, "recall": 0.982, "f1-score": 0.9613313754282917, "support": 1000.0 }, "context_tag::food": { "precision": 0.9257142857142857, "recall": 0.972, "f1-score": 0.9482926829268292, "support": 1000.0 }, "context_tag::general": { "precision": 0.9229813664596274, "recall": 0.743, "f1-score": 0.8232686980609418, "support": 1000.0 }, "context_tag::health": { "precision": 0.9536489151873767, "recall": 0.967, "f1-score": 0.9602780536246276, "support": 1000.0 }, "context_tag::social": { "precision": 0.9581304771178188, "recall": 0.984, "f1-score": 0.9708929452392698, "support": 1000.0 }, "context_tag::tech": { "precision": 0.9491691104594331, "recall": 0.971, "f1-score": 0.9599604547701434, "support": 1000.0 }, "context_tag::travel": { "precision": 0.9694280078895463, "recall": 0.983, "f1-score": 0.9761668321747765, "support": 1000.0 }, "context_tag::work": { "precision": 0.9453125, "recall": 0.968, "f1-score": 0.9565217391304348, "support": 1000.0 }, "accuracy": 0.94625, "macro avg": { "precision": 0.9457374404757546, "recall": 0.94625, "f1-score": 0.9445890976694143, "support": 8000.0 }, "weighted avg": { "precision": 0.9457374404757545, "recall": 0.94625, "f1-score": 0.9445890976694143, "support": 8000.0 } } }, "actual_epochs": 3, "best_epoch": 3, "early_stopped": false, "backbone_model_name": "microsoft/deberta-v3-base", "tokenizer_name": "microsoft/deberta-v3-base", "calibration": { "method": "temperature_grid_search", "rows": 8000, "temperature": 2.0, "loss": 0.22631261527409646 }, "artifact_scope": "task", "evaluation_suite": "standard", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet", "sha256": "d6cf7bf6638ca6d2a0b12d3e011aac120866f3cbf7364359bcc32a1f86ac3770", "bytes": 44674192 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet", "sha256": "c24ff4a481709443ccdac0bad5916fede972611b3cdd683a578f750d18a40e71", "bytes": 7175410 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet", "sha256": "b492f3fd739408de18bfd17b5c57248b51b90dba10e744f2687b50cdc351e13f", "bytes": 6746274 } }, "release_gates": { "passed": true, "checks": [] } }, "confidence_bin": { "task": "confidence_bin", "objective": "classification", "trainer": "ordinal_threshold", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/confidence_bin_model.joblib", "train_rows": 24000, "test": { "rows": 3000, "accuracy": 1.0, "macro_f1": 1.0, "weighted_f1": 1.0, "micro_f1": 1.0, "labels": [ "low", "medium", "high" ], "confusion_matrix": [ [ 1000, 0, 0 ], [ 0, 1000, 0 ], [ 0, 0, 1000 ] ], "calibration_error": 0.0, "classification_report": { "confidence_bin::high": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "confidence_bin::low": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "confidence_bin::medium": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "accuracy": 1.0, "macro avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 3000.0 }, "weighted avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 3000.0 } }, "ordinal_mae": 0.0, "off_by_two_rate": 0.0 }, "eval": { "rows": 3000, "accuracy": 1.0, "macro_f1": 1.0, "weighted_f1": 1.0, "micro_f1": 1.0, "labels": [ "low", "medium", "high" ], "confusion_matrix": [ [ 1000, 0, 0 ], [ 0, 1000, 0 ], [ 0, 0, 1000 ] ], "calibration_error": 0.0, "classification_report": { "confidence_bin::high": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "confidence_bin::low": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "confidence_bin::medium": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "accuracy": 1.0, "macro avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 3000.0 }, "weighted avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 3000.0 } }, "ordinal_mae": 0.0, "off_by_two_rate": 0.0 }, "actual_epochs": 1, "best_epoch": 1, "early_stopped": false, "boundary_count": 2, "artifact_scope": "task", "evaluation_suite": "standard", "model_kind": "ordinal_threshold", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet", "sha256": "d8bf7adebbfa6cda2ef35311b60e5b6028efd58ced64101671e6c64d4e87ca17", "bytes": 41617539 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet", "sha256": "46c4cf932e38240bb411ff50814b562f5daac3a876f807eaaaa5a52f8d981995", "bytes": 6786069 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet", "sha256": "ea69623ce36b98080f7c00ee722e45f7c870174a8967e87a5e7ed03ae18b1387", "bytes": 6369869 } }, "release_gates": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.85, "actual": 1.0, "passed": true } ] } }, "decay_profile": { "task": "decay_profile", "objective": "classification", "trainer": "ordinal_threshold", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/decay_profile_model.joblib", "train_rows": 40000, "test": { "rows": 5000, "accuracy": 1.0, "macro_f1": 1.0, "weighted_f1": 1.0, "micro_f1": 1.0, "labels": [ "very_fast", "fast", "medium", "slow", "very_slow" ], "confusion_matrix": [ [ 1000, 0, 0, 0, 0 ], [ 0, 1000, 0, 0, 0 ], [ 0, 0, 1000, 0, 0 ], [ 0, 0, 0, 1000, 0 ], [ 0, 0, 0, 0, 1000 ] ], "calibration_error": 0.0, "classification_report": { "decay_profile::fast": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::medium": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::slow": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::very_fast": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::very_slow": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "accuracy": 1.0, "macro avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 5000.0 }, "weighted avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 5000.0 } }, "ordinal_mae": 0.0, "off_by_two_rate": 0.0 }, "eval": { "rows": 5000, "accuracy": 1.0, "macro_f1": 1.0, "weighted_f1": 1.0, "micro_f1": 1.0, "labels": [ "very_fast", "fast", "medium", "slow", "very_slow" ], "confusion_matrix": [ [ 1000, 0, 0, 0, 0 ], [ 0, 1000, 0, 0, 0 ], [ 0, 0, 1000, 0, 0 ], [ 0, 0, 0, 1000, 0 ], [ 0, 0, 0, 0, 1000 ] ], "calibration_error": 0.0, "classification_report": { "decay_profile::fast": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::medium": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::slow": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::very_fast": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "decay_profile::very_slow": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 1000.0 }, "accuracy": 1.0, "macro avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 5000.0 }, "weighted avg": { "precision": 1.0, "recall": 1.0, "f1-score": 1.0, "support": 5000.0 } }, "ordinal_mae": 0.0, "off_by_two_rate": 0.0 }, "actual_epochs": 1, "best_epoch": 1, "early_stopped": false, "boundary_count": 4, "artifact_scope": "task", "evaluation_suite": "standard", "model_kind": "ordinal_threshold", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet", "sha256": "d8bf7adebbfa6cda2ef35311b60e5b6028efd58ced64101671e6c64d4e87ca17", "bytes": 41617539 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet", "sha256": "46c4cf932e38240bb411ff50814b562f5daac3a876f807eaaaa5a52f8d981995", "bytes": 6786069 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet", "sha256": "ea69623ce36b98080f7c00ee722e45f7c870174a8967e87a5e7ed03ae18b1387", "bytes": 6369869 } }, "release_gates": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.81, "actual": 1.0, "passed": true } ] } }, "pii_span_detection": { "task": "pii_span_detection", "objective": "token_classification", "trainer": "token_classification", "model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/pii_span_detection_model.joblib", "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/pii_span_detection_hf", "train_rows": 30516, "test": { "span_precision": 0.9211675795604243, "span_recall": 0.9452863749555318, "span_f1": 0.9330711426364211, "span_exact_match": 0.8445730247406225, "rows": 5012 }, "eval": { "span_precision": 0.9210037995935318, "span_recall": 0.9411286681715576, "span_f1": 0.9309574848160057, "span_exact_match": 0.851520572450805, "rows": 4472 }, "labels": { "0": "O", "1": "B-ACCOUNTNAME", "2": "I-ACCOUNTNAME", "3": "B-ACCOUNTNUMBER", "4": "I-ACCOUNTNUMBER", "5": "B-AGE", "6": "I-AGE", "7": "B-AMOUNT", "8": "I-AMOUNT", "9": "B-BIC", "10": "I-BIC", "11": "B-BITCOINADDRESS", "12": "I-BITCOINADDRESS", "13": "B-BUILDINGNUMBER", "14": "I-BUILDINGNUMBER", "15": "B-CITY", "16": "I-CITY", "17": "B-COMPANYNAME", "18": "I-COMPANYNAME", "19": "B-COUNTY", "20": "I-COUNTY", "21": "B-CREDITCARDCVV", "22": "I-CREDITCARDCVV", "23": "B-CREDITCARDISSUER", "24": "I-CREDITCARDISSUER", "25": "B-CREDITCARDNUMBER", "26": "I-CREDITCARDNUMBER", "27": "B-CURRENCY", "28": "I-CURRENCY", "29": "B-CURRENCYCODE", "30": "I-CURRENCYCODE", "31": "B-CURRENCYNAME", "32": "I-CURRENCYNAME", "33": "B-CURRENCYSYMBOL", "34": "I-CURRENCYSYMBOL", "35": "B-DATE", "36": "I-DATE", "37": "B-DOB", "38": "I-DOB", "39": "B-EMAIL", "40": "I-EMAIL", "41": "B-ETHEREUMADDRESS", "42": "I-ETHEREUMADDRESS", "43": "B-EYECOLOR", "44": "I-EYECOLOR", "45": "B-FIRSTNAME", "46": "I-FIRSTNAME", "47": "B-GENDER", "48": "I-GENDER", "49": "B-HEIGHT", "50": "I-HEIGHT", "51": "B-IBAN", "52": "I-IBAN", "53": "B-IP", "54": "I-IP", "55": "B-IPV4", "56": "I-IPV4", "57": "B-IPV6", "58": "I-IPV6", "59": "B-JOBAREA", "60": "I-JOBAREA", "61": "B-JOBTITLE", "62": "I-JOBTITLE", "63": "B-JOBTYPE", "64": "I-JOBTYPE", "65": "B-LASTNAME", "66": "I-LASTNAME", "67": "B-LITECOINADDRESS", "68": "I-LITECOINADDRESS", "69": "B-MAC", "70": "I-MAC", "71": "B-MASKEDNUMBER", "72": "I-MASKEDNUMBER", "73": "B-MIDDLENAME", "74": "I-MIDDLENAME", "75": "B-NEARBYGPSCOORDINATE", "76": "I-NEARBYGPSCOORDINATE", "77": "B-ORDINALDIRECTION", "78": "I-ORDINALDIRECTION", "79": "B-PASSWORD", "80": "I-PASSWORD", "81": "B-PHONEIMEI", "82": "I-PHONEIMEI", "83": "B-PHONENUMBER", "84": "I-PHONENUMBER", "85": "B-PIN", "86": "I-PIN", "87": "B-PREFIX", "88": "I-PREFIX", "89": "B-SECONDARYADDRESS", "90": "I-SECONDARYADDRESS", "91": "B-SECRET", "92": "I-SECRET", "93": "B-SEX", "94": "I-SEX", "95": "B-SSN", "96": "I-SSN", "97": "B-STATE", "98": "I-STATE", "99": "B-STREET", "100": "I-STREET", "101": "B-TIME", "102": "I-TIME", "103": "B-URL", "104": "I-URL", "105": "B-USERAGENT", "106": "I-USERAGENT", "107": "B-USERNAME", "108": "I-USERNAME", "109": "B-VEHICLEVIN", "110": "I-VEHICLEVIN", "111": "B-VEHICLEVRM", "112": "I-VEHICLEVRM", "113": "B-ZIPCODE", "114": "I-ZIPCODE" }, "epoch_stats": [ { "epoch": 1, "train_loss": 0.5123886795952879 }, { "epoch": 2, "train_loss": 0.10158961580695137 }, { "epoch": 3, "train_loss": 0.08095065996874068 }, { "epoch": 4, "train_loss": 0.0687989874073682 }, { "epoch": 5, "train_loss": 0.058967599591349715 }, { "epoch": 6, "train_loss": 0.04842000443624294 }, { "epoch": 7, "train_loss": 0.03766606290595617 }, { "epoch": 8, "train_loss": 0.024583430213327515 } ], "actual_epochs": 8, "best_epoch": 8, "early_stopped": false, "artifact_scope": "task", "evaluation_suite": "standard", "model_kind": "token_classification", "dataset_hashes": { "train": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pii_span_detection_train.parquet", "sha256": "f904fecb9ca45337906ff8e3d60087e38091237777e82a6313e9ef5a21e82bc8", "bytes": 3742506 }, "test": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pii_span_detection_test.parquet", "sha256": "6d75b6997a97a61e2b884dfc36099605ecd5d7e5ae3476c54cc7aa33cdb5fb81", "bytes": 607354 }, "eval": { "path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pii_span_detection_eval.parquet", "sha256": "153d5d007b854ff6023261c4182a67df1dfb219537c4cebaf69ce8ebed4a2725", "bytes": 515338 } }, "release_gates": { "passed": false, "checks": [ { "section": "test", "metric": "span_exact_match", "threshold": 0.88, "actual": 0.8445730247406225, "passed": false }, { "section": "test", "metric": "span_f1", "threshold": 0.93, "actual": 0.9330711426364211, "passed": true } ] } } }, "release_mode": false, "allow_dirty": false, "release_gates": { "schema_match_pair": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.8, "actual": 0.8551561470750885, "passed": true }, { "section": "test", "metric": "calibration_error", "threshold": { "max": 0.08 }, "actual": 0.03336120770113563, "passed": true } ] }, "memory_type": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.86, "actual": 1.0, "passed": true }, { "section": "test", "metric": "plan_f1", "threshold": 0.75, "actual": 1.0, "passed": true } ] }, "novelty_pair": { "passed": true, "checks": [ { "section": "test", "metric": "changed_f1", "threshold": 0.88, "actual": 0.9117293835068054, "passed": true } ] }, "confidence_bin": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.85, "actual": 1.0, "passed": true } ] }, "decay_profile": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.81, "actual": 1.0, "passed": true } ] }, "pii_span_detection": { "passed": true, "checks": [ { "section": "test", "metric": "span_exact_match", "threshold": 0.84, "actual": 0.8445730247406225, "passed": true }, { "section": "test", "metric": "span_f1", "threshold": 0.93, "actual": 0.9330711426364211, "passed": true } ] }, "forgetting_action_policy": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.93, "actual": 0.9994714168187103, "passed": true }, { "section": "test", "metric": "decay_recall", "threshold": 0.9, "actual": 1.0, "passed": true }, { "section": "test", "metric": "delete_recall", "threshold": 0.9, "actual": 0.9986786469344608, "passed": true } ] }, "constraint_dimension": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.88, "actual": 0.883185453547077, "passed": true }, { "section": "test", "metric": "calibration_error", "threshold": { "max": 0.06 }, "actual": 0.04340881209580012, "passed": true } ] }, "context_tag": { "passed": true, "checks": [ { "section": "test", "metric": "macro_f1", "threshold": 0.94, "actual": 0.9462078544778264, "passed": true } ] }, "retrieval_constraint_relevance_pair": { "passed": true, "checks": [ { "section": "test", "metric": "calibration_error", "threshold": { "max": 0.08 }, "actual": 0.0649609781444073, "passed": true } ] }, "memory_rerank_pair": { "passed": true, "checks": [ { "section": "test", "metric": "calibration_error", "threshold": { "max": 0.08 }, "actual": 0.06469904275987867, "passed": true } ] }, "reconsolidation_candidate_pair": { "passed": true, "checks": [ { "section": "test", "metric": "calibration_error", "threshold": { "max": 0.08 }, "actual": 0.07517948439121241, "passed": true } ] }, "write_importance_regression": { "passed": true, "checks": [ { "section": "test", "metric": "test_mae", "threshold": { "max": 0.1 }, "actual": 0.01877478314980445, "passed": true } ] } }, "runtime_thresholds": {}, "artifact_validation": { "ok": true, "errors": [] } }