tcpfn / benchmarks /intervention_results.json
mrshravan's picture
Upload benchmarks/intervention_results.json with huggingface_hub
9ca930e verified
{
"structures": {
"confounded": {
"rmse": 0.681593135140375,
"direction_accuracy": 0.0,
"trajectory_correlation": 0.0,
"null_detected": 0.0,
"pred_cate_mean": 0.6810493767981727,
"true_cate_mean": 0.0,
"n_seeds": 5
},
"mediated": {
"rmse": 0.8923469699693654,
"direction_accuracy": 0.4666666666666667,
"trajectory_correlation": -0.1076186800934075,
"null_detected": "N/A",
"pred_cate_mean": -0.0896030426301683,
"true_cate_mean": 0.5514786841923025,
"n_seeds": 5
},
"time_varying_confounded": {
"rmse": 0.40978652111886243,
"direction_accuracy": 1.0,
"trajectory_correlation": 0.0,
"null_detected": "N/A",
"pred_cate_mean": 0.18326412199096132,
"true_cate_mean": 0.5911041763020383,
"n_seeds": 5
},
"feedback": {
"rmse": 0.31327788634616005,
"direction_accuracy": 1.0,
"trajectory_correlation": 0.0,
"null_detected": "N/A",
"pred_cate_mean": 0.5442088283598423,
"true_cate_mean": 0.514855316018063,
"n_seeds": 5
},
"instrumental_variable": {
"rmse": 0.70705308193879,
"direction_accuracy": 0.9566666666666667,
"trajectory_correlation": -0.021855126454785802,
"null_detected": "N/A",
"pred_cate_mean": 0.2339213555591802,
"true_cate_mean": 0.877110000875206,
"n_seeds": 5
},
"non_identifiable": {
"rmse": 0.29658983764206714,
"direction_accuracy": 1.0,
"trajectory_correlation": -0.27477913370448287,
"null_detected": "N/A",
"pred_cate_mean": 0.8563931959867478,
"true_cate_mean": 0.6002255928070188,
"n_seeds": 5
}
},
"scenarios": {
"step": {
"scenario": "step",
"description": "Step Intervention",
"n_seeds": 5,
"trajectory_rmse": {
"mean": 0.44790337647382295,
"std": 0.11992705799993689
},
"ate_error": {
"mean": 0.1329101725025971,
"std": 0.13308464275986506
},
"direction_accuracy": {
"mean": 0.5377777777777777,
"std": 0.025915341754868006
},
"time_s": 1.6741529230494052,
"extra": {}
},
"dose_response": {
"scenario": "dose_response",
"description": "Dose-Response Curve",
"n_seeds": 5,
"trajectory_rmse": {
"mean": 0.2758524529939483,
"std": 0.07663341940224565
},
"ate_error": {
"mean": 0.13401241106339618,
"std": 0.14771866074543336
},
"direction_accuracy": {
"mean": 0.5444444444444444,
"std": 0.03296088216486962
},
"time_s": 324.4969568946399,
"extra": {}
},
"policy": {
"scenario": "policy",
"description": "Policy Comparison",
"n_seeds": 5,
"trajectory_rmse": {
"mean": 0.09002535829029422,
"std": 0.09175816283732381
},
"ate_error": {
"mean": 0.0615661122289803,
"std": 0.06800788225181435
},
"direction_accuracy": {
"mean": 0.6,
"std": 0.48989794855663565
},
"time_s": 181.22026548418216,
"extra": {}
},
"timing": {
"scenario": "timing",
"description": "Intervention Timing",
"n_seeds": 5,
"trajectory_rmse": {
"mean": 0.42171894065880655,
"std": 0.1268720400592207
},
"ate_error": {
"mean": 0.23317682692018069,
"std": 0.07347633462864078
},
"direction_accuracy": {
"mean": 0.5183333333333333,
"std": 0.04718462555630688
},
"time_s": 14.694185567088425,
"extra": {}
}
},
"machine": {
"timestamp": "2026-04-09T05:03:17.988416+00:00",
"hostname": "7aa1a49e1d2f",
"platform": "Linux-6.8.0-106-generic-x86_64-with-glibc2.39",
"python": "3.12.13",
"cpu": "x86_64",
"cpu_count": 384,
"torch_version": "2.10.0+cu130",
"gpu": "NVIDIA GeForce RTX 5090",
"gpu_count": 1,
"ram_gb": 540.5
}
}