avinashm's picture
Upload all trained models
e65379c verified
{
"manifest_schema_version": 3,
"config_path": "/nvme/CognitiveMemoryLayer/packages/models/model_pipeline.toml",
"trained_at_utc": "2026-03-25T13:59:08.669850+00:00",
"paths": {
"prepared_dir": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack",
"trained_models_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models"
},
"train_settings": {
"seed": 42,
"families": [
"router",
"extractor",
"pair"
],
"max_features": 250000,
"min_df": 2,
"ngram_min": 1,
"ngram_max": 2,
"max_iter": 25,
"alpha": 1e-05,
"predict_batch_size": 8192,
"early_stopping": true,
"early_stopping_patience": 3,
"early_stopping_metric": "macro_f1",
"early_stopping_min_delta": 0.001,
"calibration_method": "sigmoid",
"calibration_split": "eval",
"transformer": {
"model_name_or_path": "microsoft/deberta-v3-base",
"tokenizer_name": "",
"num_train_epochs": 2,
"per_device_train_batch_size": 8,
"per_device_eval_batch_size": 16,
"max_seq_length": 256,
"learning_rate": 2e-05,
"warmup_ratio": 0.1,
"weight_decay": 0.01,
"gradient_accumulation_steps": 1,
"score_margin": 0.15,
"focal_gamma": 1.5,
"temperature_grid": [
0.7,
0.85,
1.0,
1.15,
1.3,
1.5,
2.0
]
},
"token": {
"model_name_or_path": "bert-base-multilingual-cased",
"num_train_epochs": 8,
"per_device_train_batch_size": 8,
"per_device_eval_batch_size": 16,
"max_seq_length": 256,
"stride": 64,
"learning_rate": 5e-05,
"warmup_ratio": 0.1,
"weight_decay": 0.01,
"gradient_accumulation_steps": 1
},
"allow_dirty": false,
"release_mode": false,
"strict": true
},
"build_metadata": {
"python_version": "3.14.3 (main, Mar 11 2026, 19:17:30) [GCC 15.2.0]",
"dependencies": {
"scikit_learn": "1.8.0",
"joblib": "1.5.3",
"pandas": "3.0.1"
},
"commit_sha": "090060c4478c373a02eb09ae63292f51ca31a710",
"dirty": true
},
"configured_tasks": [
{
"task_name": "retrieval_constraint_relevance_pair",
"family": "pair",
"input_type": "pair",
"objective": "pair_ranking",
"enabled": true,
"artifact_name": "retrieval_constraint_relevance_pair",
"metrics": [
"mrr@10",
"ndcg@10",
"recall@10"
],
"trainer": "transformer_pair",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "BAAI/bge-reranker-base",
"tokenizer_name": ""
},
{
"task_name": "memory_rerank_pair",
"family": "pair",
"input_type": "pair",
"objective": "pair_ranking",
"enabled": true,
"artifact_name": "memory_rerank_pair",
"metrics": [
"mrr@10",
"ndcg@10",
"recall@10"
],
"trainer": "transformer_pair",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "BAAI/bge-reranker-base",
"tokenizer_name": ""
},
{
"task_name": "novelty_pair",
"family": "pair",
"input_type": "pair",
"objective": "classification",
"enabled": true,
"artifact_name": "novelty_pair",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "transformer_pair",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "BAAI/bge-reranker-base",
"tokenizer_name": ""
},
{
"task_name": "fact_extraction_structured",
"family": "extractor",
"input_type": "single",
"objective": "token_classification",
"enabled": true,
"artifact_name": "fact_extraction_structured",
"metrics": [
"span_f1",
"span_exact_match"
],
"trainer": "",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "schema_match_pair",
"family": "pair",
"input_type": "pair",
"objective": "classification",
"enabled": true,
"artifact_name": "schema_match_pair",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "transformer_pair",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "BAAI/bge-reranker-base",
"tokenizer_name": ""
},
{
"task_name": "reconsolidation_candidate_pair",
"family": "pair",
"input_type": "pair",
"objective": "pair_ranking",
"enabled": true,
"artifact_name": "reconsolidation_candidate_pair",
"metrics": [
"mrr@10",
"ndcg@10",
"recall@10"
],
"trainer": "transformer_pair",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "BAAI/bge-reranker-base",
"tokenizer_name": ""
},
{
"task_name": "write_importance_regression",
"family": "router",
"input_type": "single",
"objective": "single_regression",
"enabled": true,
"artifact_name": "write_importance_regression",
"metrics": [
"mae",
"rmse"
],
"trainer": "",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "memory_type",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "memory_type",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "hierarchical_transformer",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": ""
},
{
"task_name": "salience_bin",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "salience_bin",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1",
"ordinal_mae",
"off_by_two_rate"
],
"trainer": "ordinal_threshold",
"feature_backend": "",
"label_order": [
"low",
"medium",
"high"
],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "importance_bin",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "importance_bin",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1",
"ordinal_mae",
"off_by_two_rate"
],
"trainer": "ordinal_threshold",
"feature_backend": "",
"label_order": [
"low",
"medium",
"high"
],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "confidence_bin",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "confidence_bin",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1",
"ordinal_mae",
"off_by_two_rate"
],
"trainer": "ordinal_threshold",
"feature_backend": "",
"label_order": [
"low",
"medium",
"high"
],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "decay_profile",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "decay_profile",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1",
"ordinal_mae",
"off_by_two_rate"
],
"trainer": "ordinal_threshold",
"feature_backend": "",
"label_order": [
"very_fast",
"fast",
"medium",
"slow",
"very_slow"
],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "pii_span_detection",
"family": "extractor",
"input_type": "single",
"objective": "token_classification",
"enabled": true,
"artifact_name": "pii_span_detection",
"metrics": [
"span_f1",
"span_exact_match"
],
"trainer": "",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "",
"tokenizer_name": ""
},
{
"task_name": "consolidation_gist_quality",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "consolidation_gist_quality",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "transformer_text",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": ""
},
{
"task_name": "forgetting_action_policy",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "forgetting_action_policy",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "transformer_text",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": ""
},
{
"task_name": "constraint_dimension",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "constraint_dimension",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "transformer_text",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": ""
},
{
"task_name": "context_tag",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"artifact_name": "context_tag",
"metrics": [
"accuracy",
"macro_f1",
"weighted_f1"
],
"trainer": "transformer_text",
"feature_backend": "",
"label_order": [],
"embedding_model_name": "",
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": ""
}
],
"preflight_validation": {
"ok": true,
"strict": true,
"errors": [],
"warnings": [],
"task_checks": [
{
"task_name": "retrieval_constraint_relevance_pair",
"family": "pair",
"input_type": "pair",
"objective": "pair_ranking",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 80000,
"valid_score_rows": 0
},
{
"task_name": "memory_rerank_pair",
"family": "pair",
"input_type": "pair",
"objective": "pair_ranking",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 80000,
"valid_score_rows": 0
},
{
"task_name": "novelty_pair",
"family": "pair",
"input_type": "pair",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 117206,
"valid_score_rows": 0
},
{
"task_name": "fact_extraction_structured",
"family": "extractor",
"input_type": "single",
"objective": "token_classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 31997,
"valid_score_rows": 0
},
{
"task_name": "schema_match_pair",
"family": "pair",
"input_type": "pair",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 81200,
"valid_score_rows": 0
},
{
"task_name": "reconsolidation_candidate_pair",
"family": "pair",
"input_type": "pair",
"objective": "pair_ranking",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 80000,
"valid_score_rows": 0
},
{
"task_name": "write_importance_regression",
"family": "router",
"input_type": "single",
"objective": "single_regression",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 8000,
"valid_score_rows": 8000
},
{
"task_name": "memory_type",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 120000,
"valid_score_rows": 0
},
{
"task_name": "salience_bin",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 24000,
"valid_score_rows": 0
},
{
"task_name": "importance_bin",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 24000,
"valid_score_rows": 0
},
{
"task_name": "confidence_bin",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 24000,
"valid_score_rows": 0
},
{
"task_name": "decay_profile",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 40000,
"valid_score_rows": 0
},
{
"task_name": "pii_span_detection",
"family": "extractor",
"input_type": "single",
"objective": "token_classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 30516,
"valid_score_rows": 0
},
{
"task_name": "consolidation_gist_quality",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 10432,
"valid_score_rows": 0
},
{
"task_name": "forgetting_action_policy",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 40000,
"valid_score_rows": 0
},
{
"task_name": "constraint_dimension",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 48000,
"valid_score_rows": 0
},
{
"task_name": "context_tag",
"family": "router",
"input_type": "single",
"objective": "classification",
"enabled": true,
"status": "ok",
"reason": null,
"rows_found": 64000,
"valid_score_rows": 0
}
],
"observed_tasks_by_family": {
"extractor": [
"constraint_scope",
"constraint_stability",
"constraint_type",
"fact_type",
"pii_presence"
],
"pair": [
"conflict_detection",
"constraint_rerank",
"memory_rerank_pair",
"novelty_pair",
"reconsolidation_candidate_pair",
"retrieval_constraint_relevance_pair",
"schema_match_pair",
"scope_match",
"supersession"
],
"router": [
"confidence_bin",
"consolidation_gist_quality",
"constraint_dimension",
"context_tag",
"decay_profile",
"forgetting_action_policy",
"importance_bin",
"memory_type",
"query_domain",
"query_intent",
"salience_bin",
"write_importance_regression"
]
},
"coverage_vs_config": {
"extractor": {
"configured_enabled_tasks": [],
"observed_tasks": [
"constraint_scope",
"constraint_stability",
"constraint_type",
"fact_type",
"pii_presence"
],
"missing_configured_tasks": []
},
"pair": {
"configured_enabled_tasks": [
"memory_rerank_pair",
"novelty_pair",
"reconsolidation_candidate_pair",
"retrieval_constraint_relevance_pair",
"schema_match_pair"
],
"observed_tasks": [
"conflict_detection",
"constraint_rerank",
"memory_rerank_pair",
"novelty_pair",
"reconsolidation_candidate_pair",
"retrieval_constraint_relevance_pair",
"schema_match_pair",
"scope_match",
"supersession"
],
"missing_configured_tasks": []
},
"router": {
"configured_enabled_tasks": [
"confidence_bin",
"consolidation_gist_quality",
"constraint_dimension",
"context_tag",
"decay_profile",
"forgetting_action_policy",
"importance_bin",
"memory_type",
"salience_bin",
"write_importance_regression"
],
"observed_tasks": [
"confidence_bin",
"consolidation_gist_quality",
"constraint_dimension",
"context_tag",
"decay_profile",
"forgetting_action_policy",
"importance_bin",
"memory_type",
"query_domain",
"query_intent",
"salience_bin",
"write_importance_regression"
],
"missing_configured_tasks": []
}
}
},
"families": {
"router": {
"model_path": "packages/models/trained_models/router_model.joblib"
},
"extractor": {
"model_path": "packages/models/trained_models/extractor_model.joblib"
},
"pair": {
"model_path": "packages/models/trained_models/pair_model.joblib"
}
},
"task_training_status": {
"retrieval_constraint_relevance_pair": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "pair",
"objective": "pair_ranking",
"enabled": true
},
"memory_rerank_pair": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "pair",
"objective": "pair_ranking",
"enabled": true
},
"novelty_pair": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "pair",
"objective": "classification",
"enabled": true
},
"fact_extraction_structured": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "extractor",
"objective": "token_classification",
"enabled": true
},
"schema_match_pair": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "pair",
"objective": "classification",
"enabled": true
},
"reconsolidation_candidate_pair": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "pair",
"objective": "pair_ranking",
"enabled": true
},
"write_importance_regression": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "single_regression",
"enabled": true
},
"memory_type": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"salience_bin": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"importance_bin": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"confidence_bin": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"decay_profile": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"pii_span_detection": {
"status": "trained",
"reason": null,
"family": "extractor",
"objective": "token_classification",
"enabled": true,
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/pii_span_detection_model.joblib",
"train_rows": 30516
},
"consolidation_gist_quality": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"forgetting_action_policy": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"constraint_dimension": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
},
"context_tag": {
"status": "filtered_out",
"reason": "Excluded by --tasks filter",
"family": "router",
"objective": "classification",
"enabled": true
}
},
"task_models": {
"memory_rerank_pair": {
"model_path": "packages/models/trained_models/memory_rerank_pair_model.joblib",
"hf_model_dir": "packages/models/trained_models/memory_rerank_pair_hf"
},
"retrieval_constraint_relevance_pair": {
"model_path": "packages/models/trained_models/retrieval_constraint_relevance_pair_model.joblib",
"hf_model_dir": "packages/models/trained_models/retrieval_constraint_relevance_pair_hf"
},
"novelty_pair": {
"model_path": "packages/models/trained_models/novelty_pair_model.joblib",
"hf_model_dir": "packages/models/trained_models/novelty_pair_hf"
},
"fact_extraction_structured": {
"model_path": "packages/models/trained_models/fact_extraction_structured_model.joblib",
"hf_model_dir": "packages/models/trained_models/fact_extraction_structured_hf"
},
"schema_match_pair": {
"task": "schema_match_pair",
"objective": "classification",
"trainer": "transformer_pair",
"model_kind": "transformer_pair",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/schema_match_pair_model.joblib",
"hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/schema_match_pair_hf",
"train_rows": 81200,
"test": {
"rows": 10000,
"accuracy": 0.8552,
"macro_f1": 0.8551561470750885,
"weighted_f1": 0.8551561470750885,
"micro_f1": 0.8552,
"labels": [
"schema_match_pair::match",
"schema_match_pair::no_match"
],
"confusion_matrix": [
[
4189,
811
],
[
637,
4363
]
],
"calibration_error": 0.03336120770113563,
"classification_report": {
"schema_match_pair::match": {
"precision": 0.8680066307501036,
"recall": 0.8378,
"f1-score": 0.852635864034195,
"support": 5000.0
},
"schema_match_pair::no_match": {
"precision": 0.8432547352145342,
"recall": 0.8726,
"f1-score": 0.8576764301159819,
"support": 5000.0
},
"accuracy": 0.8552,
"macro avg": {
"precision": 0.8556306829823189,
"recall": 0.8552,
"f1-score": 0.8551561470750885,
"support": 10000.0
},
"weighted avg": {
"precision": 0.8556306829823188,
"recall": 0.8552,
"f1-score": 0.8551561470750885,
"support": 10000.0
}
}
},
"eval": {
"rows": 10000,
"accuracy": 0.8517,
"macro_f1": 0.8516351927685533,
"weighted_f1": 0.8516351927685533,
"micro_f1": 0.8517,
"labels": [
"schema_match_pair::match",
"schema_match_pair::no_match"
],
"confusion_matrix": [
[
4154,
846
],
[
637,
4363
]
],
"calibration_error": 0.03950018305884612,
"classification_report": {
"schema_match_pair::match": {
"precision": 0.8670423711125026,
"recall": 0.8308,
"f1-score": 0.848534368297416,
"support": 5000.0
},
"schema_match_pair::no_match": {
"precision": 0.8375887886350547,
"recall": 0.8726,
"f1-score": 0.8547360172396905,
"support": 5000.0
},
"accuracy": 0.8517,
"macro avg": {
"precision": 0.8523155798737787,
"recall": 0.8517,
"f1-score": 0.8516351927685533,
"support": 10000.0
},
"weighted avg": {
"precision": 0.8523155798737786,
"recall": 0.8517,
"f1-score": 0.8516351927685533,
"support": 10000.0
}
}
},
"actual_epochs": 4,
"best_epoch": 4,
"early_stopped": false,
"selection_metric": "macro_f1",
"selection_value": 0.8516351927685533,
"backbone_model_name": "BAAI/bge-reranker-base",
"tokenizer_name": "BAAI/bge-reranker-base",
"calibration": {
"method": "temperature_grid_search",
"rows": 10000,
"temperature": 1.3,
"loss": 0.3754132442613608
},
"thresholds": {
"default_threshold": 0.26,
"positive_label": "schema_match_pair::match",
"precision_floor": 0.85,
"positive_f1": 0.8544423440453687,
"positive_precision": 0.8501286873886359
},
"artifact_scope": "task",
"evaluation_suite": "standard",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pair_train.parquet",
"sha256": "5b19ae2af42d3bbeb58fa8cda2a6b40748e2561a7c4c60a464e2eced711d7c16",
"bytes": 99474783
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pair_test.parquet",
"sha256": "33f2d21d29ab684df5c9ab8df2b8bea8ffaa485434bc14bed350cea86a075a88",
"bytes": 14270999
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pair_eval.parquet",
"sha256": "cb6fae7ab447adb0d49af2de458dfbfa82f1af1efa5fd72644e2e6a9db7d07b7",
"bytes": 14298411
}
},
"release_gates": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.8,
"actual": 0.8551561470750885,
"passed": true
},
{
"section": "test",
"metric": "calibration_error",
"threshold": {
"max": 0.08
},
"actual": 0.03336120770113563,
"passed": true
}
]
}
},
"reconsolidation_candidate_pair": {
"model_path": "packages/models/trained_models/reconsolidation_candidate_pair_model.joblib",
"hf_model_dir": "packages/models/trained_models/reconsolidation_candidate_pair_hf"
},
"write_importance_regression": {
"model_path": "packages/models/trained_models/write_importance_regression_model.joblib"
},
"forgetting_action_policy": {
"task": "forgetting_action_policy",
"objective": "classification",
"trainer": "transformer_text",
"model_kind": "transformer_text",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/forgetting_action_policy_model.joblib",
"hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/forgetting_action_policy_hf",
"train_rows": 28580,
"test": {
"rows": 18920,
"accuracy": 0.9994714587737844,
"macro_f1": 0.9994714168187103,
"weighted_f1": 0.9994714168187103,
"micro_f1": 0.9994714587737844,
"labels": [
"forgetting_action_policy::compress",
"forgetting_action_policy::decay",
"forgetting_action_policy::delete",
"forgetting_action_policy::keep",
"forgetting_action_policy::silence"
],
"confusion_matrix": [
[
3782,
2,
0,
0,
0
],
[
0,
3784,
0,
0,
0
],
[
0,
0,
3779,
1,
4
],
[
0,
0,
0,
3784,
0
],
[
2,
0,
1,
0,
3781
]
],
"calibration_error": 0.01649172677837832,
"classification_report": {
"forgetting_action_policy::compress": {
"precision": 0.9994714587737844,
"recall": 0.9994714587737844,
"f1-score": 0.9994714587737844,
"support": 3784.0
},
"forgetting_action_policy::decay": {
"precision": 0.9994717379820391,
"recall": 1.0,
"f1-score": 0.9997357992073976,
"support": 3784.0
},
"forgetting_action_policy::delete": {
"precision": 0.9997354497354497,
"recall": 0.9986786469344608,
"f1-score": 0.9992067689053411,
"support": 3784.0
},
"forgetting_action_policy::keep": {
"precision": 0.9997357992073976,
"recall": 1.0,
"f1-score": 0.9998678821508786,
"support": 3784.0
},
"forgetting_action_policy::silence": {
"precision": 0.9989431968295905,
"recall": 0.9992071881606766,
"f1-score": 0.9990751750561501,
"support": 3784.0
},
"accuracy": 0.9994714587737844,
"macro avg": {
"precision": 0.9994715285056524,
"recall": 0.9994714587737844,
"f1-score": 0.9994714168187103,
"support": 18920.0
},
"weighted avg": {
"precision": 0.9994715285056522,
"recall": 0.9994714587737844,
"f1-score": 0.9994714168187103,
"support": 18920.0
}
}
},
"eval": {
"rows": 5000,
"accuracy": 0.984,
"macro_f1": 0.9839922007228425,
"weighted_f1": 0.9839922007228427,
"micro_f1": 0.984,
"labels": [
"forgetting_action_policy::compress",
"forgetting_action_policy::decay",
"forgetting_action_policy::delete",
"forgetting_action_policy::keep",
"forgetting_action_policy::silence"
],
"confusion_matrix": [
[
988,
3,
0,
9,
0
],
[
3,
986,
1,
1,
9
],
[
2,
0,
994,
0,
4
],
[
6,
11,
0,
979,
4
],
[
2,
11,
11,
3,
973
]
],
"calibration_error": 0.0073812406567217975,
"classification_report": {
"forgetting_action_policy::compress": {
"precision": 0.987012987012987,
"recall": 0.988,
"f1-score": 0.9875062468765617,
"support": 1000.0
},
"forgetting_action_policy::decay": {
"precision": 0.9752720079129574,
"recall": 0.986,
"f1-score": 0.9806066633515664,
"support": 1000.0
},
"forgetting_action_policy::delete": {
"precision": 0.9880715705765407,
"recall": 0.994,
"f1-score": 0.9910269192422732,
"support": 1000.0
},
"forgetting_action_policy::keep": {
"precision": 0.9868951612903226,
"recall": 0.979,
"f1-score": 0.9829317269076305,
"support": 1000.0
},
"forgetting_action_policy::silence": {
"precision": 0.9828282828282828,
"recall": 0.973,
"f1-score": 0.9778894472361809,
"support": 1000.0
},
"accuracy": 0.984,
"macro avg": {
"precision": 0.984016001924218,
"recall": 0.984,
"f1-score": 0.9839922007228425,
"support": 5000.0
},
"weighted avg": {
"precision": 0.9840160019242181,
"recall": 0.984,
"f1-score": 0.9839922007228427,
"support": 5000.0
}
}
},
"actual_epochs": 8,
"best_epoch": 7,
"early_stopped": false,
"selection_metric": "macro_f1",
"selection_value": 0.9839922007228425,
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": "microsoft/deberta-v3-base",
"calibration": {
"method": "temperature_grid_search",
"rows": 5000,
"temperature": 2.0,
"loss": 0.08134587520392533
},
"artifact_scope": "task",
"evaluation_suite": "standard",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet",
"sha256": "d6cf7bf6638ca6d2a0b12d3e011aac120866f3cbf7364359bcc32a1f86ac3770",
"bytes": 44674192
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet",
"sha256": "2665b088823ca9733c9f53a62aa9e4c8f6148a8d169ebfb69641d04a3e710552",
"bytes": 7175410
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet",
"sha256": "b492f3fd739408de18bfd17b5c57248b51b90dba10e744f2687b50cdc351e13f",
"bytes": 6746274
}
},
"release_gates": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.93,
"actual": 0.9994714168187103,
"passed": true
},
{
"section": "test",
"metric": "decay_recall",
"threshold": 0.9,
"actual": 1.0,
"passed": true
},
{
"section": "test",
"metric": "delete_recall",
"threshold": 0.9,
"actual": 0.9986786469344608,
"passed": true
}
]
}
},
"constraint_dimension": {
"task": "constraint_dimension",
"objective": "classification",
"trainer": "transformer_text",
"model_kind": "transformer_text",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/constraint_dimension_model.joblib",
"hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/constraint_dimension_hf",
"train_rows": 48000,
"test": {
"rows": 6000,
"accuracy": 0.8828333333333334,
"macro_f1": 0.883185453547077,
"weighted_f1": 0.883185453547077,
"micro_f1": 0.8828333333333334,
"labels": [
"constraint_dimension::causal",
"constraint_dimension::goal",
"constraint_dimension::other",
"constraint_dimension::policy",
"constraint_dimension::state",
"constraint_dimension::value"
],
"confusion_matrix": [
[
966,
2,
20,
1,
7,
4
],
[
1,
927,
47,
2,
6,
17
],
[
12,
30,
817,
22,
56,
63
],
[
0,
2,
26,
949,
1,
22
],
[
27,
7,
63,
8,
865,
30
],
[
7,
19,
137,
27,
37,
773
]
],
"calibration_error": 0.08291319935909541,
"classification_report": {
"constraint_dimension::causal": {
"precision": 0.9536031589338598,
"recall": 0.966,
"f1-score": 0.9597615499254843,
"support": 1000.0
},
"constraint_dimension::goal": {
"precision": 0.939209726443769,
"recall": 0.927,
"f1-score": 0.9330649219929542,
"support": 1000.0
},
"constraint_dimension::other": {
"precision": 0.7360360360360361,
"recall": 0.817,
"f1-score": 0.7744075829383886,
"support": 1000.0
},
"constraint_dimension::policy": {
"precision": 0.9405351833498513,
"recall": 0.949,
"f1-score": 0.944748631159781,
"support": 1000.0
},
"constraint_dimension::state": {
"precision": 0.8899176954732511,
"recall": 0.865,
"f1-score": 0.8772819472616633,
"support": 1000.0
},
"constraint_dimension::value": {
"precision": 0.8503850385038504,
"recall": 0.773,
"f1-score": 0.8098480880041907,
"support": 1000.0
},
"accuracy": 0.8828333333333334,
"macro avg": {
"precision": 0.8849478064567696,
"recall": 0.8828333333333332,
"f1-score": 0.883185453547077,
"support": 6000.0
},
"weighted avg": {
"precision": 0.8849478064567696,
"recall": 0.8828333333333334,
"f1-score": 0.883185453547077,
"support": 6000.0
}
}
},
"eval": {
"rows": 6000,
"accuracy": 0.8698333333333333,
"macro_f1": 0.8703105353987516,
"weighted_f1": 0.8703105353987517,
"micro_f1": 0.8698333333333333,
"labels": [
"constraint_dimension::causal",
"constraint_dimension::goal",
"constraint_dimension::other",
"constraint_dimension::policy",
"constraint_dimension::state",
"constraint_dimension::value"
],
"confusion_matrix": [
[
965,
2,
16,
0,
12,
5
],
[
1,
907,
57,
1,
9,
25
],
[
19,
31,
791,
18,
56,
85
],
[
1,
0,
22,
954,
2,
21
],
[
27,
13,
78,
6,
842,
34
],
[
13,
23,
145,
23,
36,
760
]
],
"calibration_error": 0.09575599064379686,
"classification_report": {
"constraint_dimension::causal": {
"precision": 0.9405458089668616,
"recall": 0.965,
"f1-score": 0.9526159921026653,
"support": 1000.0
},
"constraint_dimension::goal": {
"precision": 0.9293032786885246,
"recall": 0.907,
"f1-score": 0.9180161943319838,
"support": 1000.0
},
"constraint_dimension::other": {
"precision": 0.7132551848512173,
"recall": 0.791,
"f1-score": 0.7501185395922239,
"support": 1000.0
},
"constraint_dimension::policy": {
"precision": 0.9520958083832335,
"recall": 0.954,
"f1-score": 0.9530469530469531,
"support": 1000.0
},
"constraint_dimension::state": {
"precision": 0.8798328108672936,
"recall": 0.842,
"f1-score": 0.8605007664793051,
"support": 1000.0
},
"constraint_dimension::value": {
"precision": 0.8172043010752689,
"recall": 0.76,
"f1-score": 0.7875647668393783,
"support": 1000.0
},
"accuracy": 0.8698333333333333,
"macro avg": {
"precision": 0.8720395321387332,
"recall": 0.8698333333333332,
"f1-score": 0.8703105353987516,
"support": 6000.0
},
"weighted avg": {
"precision": 0.8720395321387332,
"recall": 0.8698333333333333,
"f1-score": 0.8703105353987517,
"support": 6000.0
}
}
},
"actual_epochs": 10,
"best_epoch": 10,
"early_stopped": false,
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": "microsoft/deberta-v3-base",
"calibration": {
"method": "temperature_grid_search",
"rows": 6000,
"temperature": 2.0,
"loss": 0.5294126563569427
},
"artifact_scope": "task",
"evaluation_suite": "standard",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet",
"sha256": "d6cf7bf6638ca6d2a0b12d3e011aac120866f3cbf7364359bcc32a1f86ac3770",
"bytes": 44674192
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet",
"sha256": "c24ff4a481709443ccdac0bad5916fede972611b3cdd683a578f750d18a40e71",
"bytes": 7175410
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet",
"sha256": "b492f3fd739408de18bfd17b5c57248b51b90dba10e744f2687b50cdc351e13f",
"bytes": 6746274
}
},
"release_gates": {
"passed": true,
"checks": []
}
},
"context_tag": {
"task": "context_tag",
"objective": "classification",
"trainer": "transformer_text",
"model_kind": "transformer_text",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/context_tag_model.joblib",
"hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/context_tag_hf",
"train_rows": 64000,
"test": {
"rows": 8000,
"accuracy": 0.947375,
"macro_f1": 0.9462078544778264,
"weighted_f1": 0.9462078544778263,
"micro_f1": 0.947375,
"labels": [
"context_tag::finance",
"context_tag::food",
"context_tag::general",
"context_tag::health",
"context_tag::social",
"context_tag::tech",
"context_tag::travel",
"context_tag::work"
],
"confusion_matrix": [
[
979,
0,
12,
1,
0,
3,
1,
4
],
[
0,
951,
15,
24,
8,
0,
2,
0
],
[
52,
34,
775,
27,
28,
21,
30,
33
],
[
0,
13,
15,
972,
0,
0,
0,
0
],
[
1,
5,
10,
0,
975,
0,
6,
3
],
[
2,
0,
9,
0,
0,
975,
0,
14
],
[
4,
0,
4,
0,
4,
1,
986,
1
],
[
5,
0,
11,
0,
0,
17,
1,
966
]
],
"calibration_error": 0.024662236875587645,
"classification_report": {
"context_tag::finance": {
"precision": 0.9386385426653883,
"recall": 0.979,
"f1-score": 0.9583945178658835,
"support": 1000.0
},
"context_tag::food": {
"precision": 0.9481555333998006,
"recall": 0.951,
"f1-score": 0.9495756365451822,
"support": 1000.0
},
"context_tag::general": {
"precision": 0.9106933019976499,
"recall": 0.775,
"f1-score": 0.8373851971907077,
"support": 1000.0
},
"context_tag::health": {
"precision": 0.94921875,
"recall": 0.972,
"f1-score": 0.9604743083003953,
"support": 1000.0
},
"context_tag::social": {
"precision": 0.9605911330049262,
"recall": 0.975,
"f1-score": 0.967741935483871,
"support": 1000.0
},
"context_tag::tech": {
"precision": 0.9587020648967551,
"recall": 0.975,
"f1-score": 0.9667823500247893,
"support": 1000.0
},
"context_tag::travel": {
"precision": 0.9610136452241715,
"recall": 0.986,
"f1-score": 0.9733464955577492,
"support": 1000.0
},
"context_tag::work": {
"precision": 0.9461312438785504,
"recall": 0.966,
"f1-score": 0.9559623948540327,
"support": 1000.0
},
"accuracy": 0.947375,
"macro avg": {
"precision": 0.9466430268834052,
"recall": 0.947375,
"f1-score": 0.9462078544778264,
"support": 8000.0
},
"weighted avg": {
"precision": 0.9466430268834054,
"recall": 0.947375,
"f1-score": 0.9462078544778263,
"support": 8000.0
}
}
},
"eval": {
"rows": 8000,
"accuracy": 0.94625,
"macro_f1": 0.9445890976694143,
"weighted_f1": 0.9445890976694143,
"micro_f1": 0.94625,
"labels": [
"context_tag::finance",
"context_tag::food",
"context_tag::general",
"context_tag::health",
"context_tag::social",
"context_tag::tech",
"context_tag::travel",
"context_tag::work"
],
"confusion_matrix": [
[
982,
0,
8,
0,
0,
4,
0,
6
],
[
1,
972,
9,
11,
6,
0,
1,
0
],
[
50,
53,
743,
33,
29,
26,
27,
39
],
[
1,
18,
10,
967,
1,
2,
0,
1
],
[
2,
5,
4,
1,
984,
0,
2,
2
],
[
5,
0,
14,
2,
1,
971,
0,
7
],
[
1,
2,
6,
0,
6,
1,
983,
1
],
[
1,
0,
11,
0,
0,
19,
1,
968
]
],
"calibration_error": 0.023930798305538282,
"classification_report": {
"context_tag::finance": {
"precision": 0.9415148609779482,
"recall": 0.982,
"f1-score": 0.9613313754282917,
"support": 1000.0
},
"context_tag::food": {
"precision": 0.9257142857142857,
"recall": 0.972,
"f1-score": 0.9482926829268292,
"support": 1000.0
},
"context_tag::general": {
"precision": 0.9229813664596274,
"recall": 0.743,
"f1-score": 0.8232686980609418,
"support": 1000.0
},
"context_tag::health": {
"precision": 0.9536489151873767,
"recall": 0.967,
"f1-score": 0.9602780536246276,
"support": 1000.0
},
"context_tag::social": {
"precision": 0.9581304771178188,
"recall": 0.984,
"f1-score": 0.9708929452392698,
"support": 1000.0
},
"context_tag::tech": {
"precision": 0.9491691104594331,
"recall": 0.971,
"f1-score": 0.9599604547701434,
"support": 1000.0
},
"context_tag::travel": {
"precision": 0.9694280078895463,
"recall": 0.983,
"f1-score": 0.9761668321747765,
"support": 1000.0
},
"context_tag::work": {
"precision": 0.9453125,
"recall": 0.968,
"f1-score": 0.9565217391304348,
"support": 1000.0
},
"accuracy": 0.94625,
"macro avg": {
"precision": 0.9457374404757546,
"recall": 0.94625,
"f1-score": 0.9445890976694143,
"support": 8000.0
},
"weighted avg": {
"precision": 0.9457374404757545,
"recall": 0.94625,
"f1-score": 0.9445890976694143,
"support": 8000.0
}
}
},
"actual_epochs": 3,
"best_epoch": 3,
"early_stopped": false,
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": "microsoft/deberta-v3-base",
"calibration": {
"method": "temperature_grid_search",
"rows": 8000,
"temperature": 2.0,
"loss": 0.22631261527409646
},
"artifact_scope": "task",
"evaluation_suite": "standard",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet",
"sha256": "d6cf7bf6638ca6d2a0b12d3e011aac120866f3cbf7364359bcc32a1f86ac3770",
"bytes": 44674192
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet",
"sha256": "c24ff4a481709443ccdac0bad5916fede972611b3cdd683a578f750d18a40e71",
"bytes": 7175410
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet",
"sha256": "b492f3fd739408de18bfd17b5c57248b51b90dba10e744f2687b50cdc351e13f",
"bytes": 6746274
}
},
"release_gates": {
"passed": true,
"checks": []
}
},
"confidence_bin": {
"task": "confidence_bin",
"objective": "classification",
"trainer": "ordinal_threshold",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/confidence_bin_model.joblib",
"train_rows": 24000,
"test": {
"rows": 3000,
"accuracy": 1.0,
"macro_f1": 1.0,
"weighted_f1": 1.0,
"micro_f1": 1.0,
"labels": [
"low",
"medium",
"high"
],
"confusion_matrix": [
[
1000,
0,
0
],
[
0,
1000,
0
],
[
0,
0,
1000
]
],
"calibration_error": 0.0,
"classification_report": {
"confidence_bin::high": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"confidence_bin::low": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"confidence_bin::medium": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"accuracy": 1.0,
"macro avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 3000.0
},
"weighted avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 3000.0
}
},
"ordinal_mae": 0.0,
"off_by_two_rate": 0.0
},
"eval": {
"rows": 3000,
"accuracy": 1.0,
"macro_f1": 1.0,
"weighted_f1": 1.0,
"micro_f1": 1.0,
"labels": [
"low",
"medium",
"high"
],
"confusion_matrix": [
[
1000,
0,
0
],
[
0,
1000,
0
],
[
0,
0,
1000
]
],
"calibration_error": 0.0,
"classification_report": {
"confidence_bin::high": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"confidence_bin::low": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"confidence_bin::medium": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"accuracy": 1.0,
"macro avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 3000.0
},
"weighted avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 3000.0
}
},
"ordinal_mae": 0.0,
"off_by_two_rate": 0.0
},
"actual_epochs": 1,
"best_epoch": 1,
"early_stopped": false,
"boundary_count": 2,
"artifact_scope": "task",
"evaluation_suite": "standard",
"model_kind": "ordinal_threshold",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet",
"sha256": "d8bf7adebbfa6cda2ef35311b60e5b6028efd58ced64101671e6c64d4e87ca17",
"bytes": 41617539
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet",
"sha256": "46c4cf932e38240bb411ff50814b562f5daac3a876f807eaaaa5a52f8d981995",
"bytes": 6786069
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet",
"sha256": "ea69623ce36b98080f7c00ee722e45f7c870174a8967e87a5e7ed03ae18b1387",
"bytes": 6369869
}
},
"release_gates": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.85,
"actual": 1.0,
"passed": true
}
]
}
},
"decay_profile": {
"task": "decay_profile",
"objective": "classification",
"trainer": "ordinal_threshold",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/decay_profile_model.joblib",
"train_rows": 40000,
"test": {
"rows": 5000,
"accuracy": 1.0,
"macro_f1": 1.0,
"weighted_f1": 1.0,
"micro_f1": 1.0,
"labels": [
"very_fast",
"fast",
"medium",
"slow",
"very_slow"
],
"confusion_matrix": [
[
1000,
0,
0,
0,
0
],
[
0,
1000,
0,
0,
0
],
[
0,
0,
1000,
0,
0
],
[
0,
0,
0,
1000,
0
],
[
0,
0,
0,
0,
1000
]
],
"calibration_error": 0.0,
"classification_report": {
"decay_profile::fast": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::medium": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::slow": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::very_fast": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::very_slow": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"accuracy": 1.0,
"macro avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 5000.0
},
"weighted avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 5000.0
}
},
"ordinal_mae": 0.0,
"off_by_two_rate": 0.0
},
"eval": {
"rows": 5000,
"accuracy": 1.0,
"macro_f1": 1.0,
"weighted_f1": 1.0,
"micro_f1": 1.0,
"labels": [
"very_fast",
"fast",
"medium",
"slow",
"very_slow"
],
"confusion_matrix": [
[
1000,
0,
0,
0,
0
],
[
0,
1000,
0,
0,
0
],
[
0,
0,
1000,
0,
0
],
[
0,
0,
0,
1000,
0
],
[
0,
0,
0,
0,
1000
]
],
"calibration_error": 0.0,
"classification_report": {
"decay_profile::fast": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::medium": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::slow": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::very_fast": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"decay_profile::very_slow": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 1000.0
},
"accuracy": 1.0,
"macro avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 5000.0
},
"weighted avg": {
"precision": 1.0,
"recall": 1.0,
"f1-score": 1.0,
"support": 5000.0
}
},
"ordinal_mae": 0.0,
"off_by_two_rate": 0.0
},
"actual_epochs": 1,
"best_epoch": 1,
"early_stopped": false,
"boundary_count": 4,
"artifact_scope": "task",
"evaluation_suite": "standard",
"model_kind": "ordinal_threshold",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_train.parquet",
"sha256": "d8bf7adebbfa6cda2ef35311b60e5b6028efd58ced64101671e6c64d4e87ca17",
"bytes": 41617539
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_test.parquet",
"sha256": "46c4cf932e38240bb411ff50814b562f5daac3a876f807eaaaa5a52f8d981995",
"bytes": 6786069
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/router_eval.parquet",
"sha256": "ea69623ce36b98080f7c00ee722e45f7c870174a8967e87a5e7ed03ae18b1387",
"bytes": 6369869
}
},
"release_gates": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.81,
"actual": 1.0,
"passed": true
}
]
}
},
"pii_span_detection": {
"task": "pii_span_detection",
"objective": "token_classification",
"trainer": "token_classification",
"model_path": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/pii_span_detection_model.joblib",
"hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/pii_span_detection_hf",
"train_rows": 30516,
"test": {
"span_precision": 0.9211675795604243,
"span_recall": 0.9452863749555318,
"span_f1": 0.9330711426364211,
"span_exact_match": 0.8445730247406225,
"rows": 5012
},
"eval": {
"span_precision": 0.9210037995935318,
"span_recall": 0.9411286681715576,
"span_f1": 0.9309574848160057,
"span_exact_match": 0.851520572450805,
"rows": 4472
},
"labels": {
"0": "O",
"1": "B-ACCOUNTNAME",
"2": "I-ACCOUNTNAME",
"3": "B-ACCOUNTNUMBER",
"4": "I-ACCOUNTNUMBER",
"5": "B-AGE",
"6": "I-AGE",
"7": "B-AMOUNT",
"8": "I-AMOUNT",
"9": "B-BIC",
"10": "I-BIC",
"11": "B-BITCOINADDRESS",
"12": "I-BITCOINADDRESS",
"13": "B-BUILDINGNUMBER",
"14": "I-BUILDINGNUMBER",
"15": "B-CITY",
"16": "I-CITY",
"17": "B-COMPANYNAME",
"18": "I-COMPANYNAME",
"19": "B-COUNTY",
"20": "I-COUNTY",
"21": "B-CREDITCARDCVV",
"22": "I-CREDITCARDCVV",
"23": "B-CREDITCARDISSUER",
"24": "I-CREDITCARDISSUER",
"25": "B-CREDITCARDNUMBER",
"26": "I-CREDITCARDNUMBER",
"27": "B-CURRENCY",
"28": "I-CURRENCY",
"29": "B-CURRENCYCODE",
"30": "I-CURRENCYCODE",
"31": "B-CURRENCYNAME",
"32": "I-CURRENCYNAME",
"33": "B-CURRENCYSYMBOL",
"34": "I-CURRENCYSYMBOL",
"35": "B-DATE",
"36": "I-DATE",
"37": "B-DOB",
"38": "I-DOB",
"39": "B-EMAIL",
"40": "I-EMAIL",
"41": "B-ETHEREUMADDRESS",
"42": "I-ETHEREUMADDRESS",
"43": "B-EYECOLOR",
"44": "I-EYECOLOR",
"45": "B-FIRSTNAME",
"46": "I-FIRSTNAME",
"47": "B-GENDER",
"48": "I-GENDER",
"49": "B-HEIGHT",
"50": "I-HEIGHT",
"51": "B-IBAN",
"52": "I-IBAN",
"53": "B-IP",
"54": "I-IP",
"55": "B-IPV4",
"56": "I-IPV4",
"57": "B-IPV6",
"58": "I-IPV6",
"59": "B-JOBAREA",
"60": "I-JOBAREA",
"61": "B-JOBTITLE",
"62": "I-JOBTITLE",
"63": "B-JOBTYPE",
"64": "I-JOBTYPE",
"65": "B-LASTNAME",
"66": "I-LASTNAME",
"67": "B-LITECOINADDRESS",
"68": "I-LITECOINADDRESS",
"69": "B-MAC",
"70": "I-MAC",
"71": "B-MASKEDNUMBER",
"72": "I-MASKEDNUMBER",
"73": "B-MIDDLENAME",
"74": "I-MIDDLENAME",
"75": "B-NEARBYGPSCOORDINATE",
"76": "I-NEARBYGPSCOORDINATE",
"77": "B-ORDINALDIRECTION",
"78": "I-ORDINALDIRECTION",
"79": "B-PASSWORD",
"80": "I-PASSWORD",
"81": "B-PHONEIMEI",
"82": "I-PHONEIMEI",
"83": "B-PHONENUMBER",
"84": "I-PHONENUMBER",
"85": "B-PIN",
"86": "I-PIN",
"87": "B-PREFIX",
"88": "I-PREFIX",
"89": "B-SECONDARYADDRESS",
"90": "I-SECONDARYADDRESS",
"91": "B-SECRET",
"92": "I-SECRET",
"93": "B-SEX",
"94": "I-SEX",
"95": "B-SSN",
"96": "I-SSN",
"97": "B-STATE",
"98": "I-STATE",
"99": "B-STREET",
"100": "I-STREET",
"101": "B-TIME",
"102": "I-TIME",
"103": "B-URL",
"104": "I-URL",
"105": "B-USERAGENT",
"106": "I-USERAGENT",
"107": "B-USERNAME",
"108": "I-USERNAME",
"109": "B-VEHICLEVIN",
"110": "I-VEHICLEVIN",
"111": "B-VEHICLEVRM",
"112": "I-VEHICLEVRM",
"113": "B-ZIPCODE",
"114": "I-ZIPCODE"
},
"epoch_stats": [
{
"epoch": 1,
"train_loss": 0.5123886795952879
},
{
"epoch": 2,
"train_loss": 0.10158961580695137
},
{
"epoch": 3,
"train_loss": 0.08095065996874068
},
{
"epoch": 4,
"train_loss": 0.0687989874073682
},
{
"epoch": 5,
"train_loss": 0.058967599591349715
},
{
"epoch": 6,
"train_loss": 0.04842000443624294
},
{
"epoch": 7,
"train_loss": 0.03766606290595617
},
{
"epoch": 8,
"train_loss": 0.024583430213327515
}
],
"actual_epochs": 8,
"best_epoch": 8,
"early_stopped": false,
"artifact_scope": "task",
"evaluation_suite": "standard",
"model_kind": "token_classification",
"dataset_hashes": {
"train": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pii_span_detection_train.parquet",
"sha256": "f904fecb9ca45337906ff8e3d60087e38091237777e82a6313e9ef5a21e82bc8",
"bytes": 3742506
},
"test": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pii_span_detection_test.parquet",
"sha256": "6d75b6997a97a61e2b884dfc36099605ecd5d7e5ae3476c54cc7aa33cdb5fb81",
"bytes": 607354
},
"eval": {
"path": "/nvme/CognitiveMemoryLayer/packages/models/prepared_data/modelpack/pii_span_detection_eval.parquet",
"sha256": "153d5d007b854ff6023261c4182a67df1dfb219537c4cebaf69ce8ebed4a2725",
"bytes": 515338
}
},
"release_gates": {
"passed": false,
"checks": [
{
"section": "test",
"metric": "span_exact_match",
"threshold": 0.88,
"actual": 0.8445730247406225,
"passed": false
},
{
"section": "test",
"metric": "span_f1",
"threshold": 0.93,
"actual": 0.9330711426364211,
"passed": true
}
]
}
}
},
"release_mode": false,
"allow_dirty": false,
"release_gates": {
"schema_match_pair": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.8,
"actual": 0.8551561470750885,
"passed": true
},
{
"section": "test",
"metric": "calibration_error",
"threshold": {
"max": 0.08
},
"actual": 0.03336120770113563,
"passed": true
}
]
},
"memory_type": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.86,
"actual": 1.0,
"passed": true
},
{
"section": "test",
"metric": "plan_f1",
"threshold": 0.75,
"actual": 1.0,
"passed": true
}
]
},
"novelty_pair": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "changed_f1",
"threshold": 0.88,
"actual": 0.9117293835068054,
"passed": true
}
]
},
"confidence_bin": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.85,
"actual": 1.0,
"passed": true
}
]
},
"decay_profile": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.81,
"actual": 1.0,
"passed": true
}
]
},
"pii_span_detection": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "span_exact_match",
"threshold": 0.84,
"actual": 0.8445730247406225,
"passed": true
},
{
"section": "test",
"metric": "span_f1",
"threshold": 0.93,
"actual": 0.9330711426364211,
"passed": true
}
]
},
"forgetting_action_policy": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.93,
"actual": 0.9994714168187103,
"passed": true
},
{
"section": "test",
"metric": "decay_recall",
"threshold": 0.9,
"actual": 1.0,
"passed": true
},
{
"section": "test",
"metric": "delete_recall",
"threshold": 0.9,
"actual": 0.9986786469344608,
"passed": true
}
]
},
"constraint_dimension": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.88,
"actual": 0.883185453547077,
"passed": true
},
{
"section": "test",
"metric": "calibration_error",
"threshold": {
"max": 0.06
},
"actual": 0.04340881209580012,
"passed": true
}
]
},
"context_tag": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "macro_f1",
"threshold": 0.94,
"actual": 0.9462078544778264,
"passed": true
}
]
},
"retrieval_constraint_relevance_pair": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "calibration_error",
"threshold": {
"max": 0.08
},
"actual": 0.0649609781444073,
"passed": true
}
]
},
"memory_rerank_pair": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "calibration_error",
"threshold": {
"max": 0.08
},
"actual": 0.06469904275987867,
"passed": true
}
]
},
"reconsolidation_candidate_pair": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "calibration_error",
"threshold": {
"max": 0.08
},
"actual": 0.07517948439121241,
"passed": true
}
]
},
"write_importance_regression": {
"passed": true,
"checks": [
{
"section": "test",
"metric": "test_mae",
"threshold": {
"max": 0.1
},
"actual": 0.01877478314980445,
"passed": true
}
]
}
},
"runtime_thresholds": {},
"artifact_validation": {
"ok": true,
"errors": []
}
}