{ "schema_version": "dataforge_eval_diagnostics_v1", "model_repo": "Praneshrajan15/DataForge-0.5B-SFT", "dataset_repo": "Praneshrajan15/dataforge-sft-trajectories", "dataset_sha": "94e2dd556d4f1260c5123d93ca6bf4f9da9b160a", "base_model": "Qwen/Qwen2.5-0.5B-Instruct", "quality_gate_failures": [], "promotion_slice": "deterministic_normalization", "slice_scores": { "base": { "deterministic_normalization": { "tasks": 20, "macro_f1": 0.0, "mean_f1": 0.0, "parse_success_rate": 1.0, "schema_case_error_count": 29, "finish_rate": 0.0, "false_repair_rate": 1.0, "false_repair_count": 73, "dataset_f1": { "beers": 0.0 } }, "external_reference_required": { "tasks": 66, "macro_f1": 0.0093, "mean_f1": 0.0081, "parse_success_rate": 1.0, "schema_case_error_count": 70, "finish_rate": 0.0, "false_repair_rate": 0.9882, "false_repair_count": 252, "dataset_f1": { "beers": 0.0154, "flights": 0.0, "hospital": 0.0125 } }, "not_inferable_from_prompt": { "tasks": 14, "macro_f1": 0.0, "mean_f1": 0.0, "parse_success_rate": 1.0, "schema_case_error_count": 14, "finish_rate": 0.0, "false_repair_rate": 1.0, "false_repair_count": 46, "dataset_f1": { "flights": 0.0, "hospital": 0.0 } } }, "sft": { "deterministic_normalization": { "tasks": 20, "macro_f1": 0.0077, "mean_f1": 0.0077, "parse_success_rate": 1.0, "schema_case_error_count": 0, "finish_rate": 0.05, "false_repair_rate": 0.9867, "false_repair_count": 74, "dataset_f1": { "beers": 0.0077 } }, "external_reference_required": { "tasks": 66, "macro_f1": 0.014, "mean_f1": 0.0137, "parse_success_rate": 0.9848, "schema_case_error_count": 8, "finish_rate": 0.0758, "false_repair_rate": 0.9831, "false_repair_count": 233, "dataset_f1": { "beers": 0.0154, "flights": 0.016, "hospital": 0.0106 } }, "not_inferable_from_prompt": { "tasks": 14, "macro_f1": 0.0, "mean_f1": 0.0, "parse_success_rate": 1.0, "schema_case_error_count": 8, "finish_rate": 0.0, "false_repair_rate": 1.0, "false_repair_count": 53, "dataset_f1": { "flights": 0.0, "hospital": 0.0 } } } }, "base": { "model_label": "base", "task_scores": [ { "task_index": 1, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.25, "precision": 0.25, "recall": 0.25, "tp": 1, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 2, "schema_case_error": 1 } }, { "task_index": 2, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 } }, { "task_index": 3, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 3 } }, { "task_index": 4, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 5, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 6, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 4 } }, { "task_index": 7, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 3 } }, { "task_index": 8, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 9, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 } }, { "task_index": 10, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 } }, { "task_index": 11, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 14, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 14, "wrong_cell": 4 } }, { "task_index": 12, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "wrong_cell": 4 } }, { "task_index": 13, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 14, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 3 } }, { "task_index": 15, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 } }, { "task_index": 16, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 3 } }, { "task_index": 17, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "wrong_value": 4 } }, { "task_index": 18, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 4 } }, { "task_index": 19, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 20, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 21, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 } }, { "task_index": 22, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 2, "schema_case_error": 4 } }, { "task_index": 23, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 4 } }, { "task_index": 24, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 4 } }, { "task_index": 25, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 5, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "overrepair": 3, "schema_case_error": 1, "wrong_cell": 1 } }, { "task_index": 26, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 2 } }, { "task_index": 27, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 28, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 1, "schema_case_error": 4 } }, { "task_index": 29, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_cell": 4 } }, { "task_index": 30, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_cell": 4 } }, { "task_index": 31, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 32, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "wrong_cell": 4 } }, { "task_index": 33, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 13, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 13, "overrepair": 4 } }, { "task_index": 34, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 1, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 35, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 36, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 4 } }, { "task_index": 37, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.087, "precision": 0.05, "recall": 0.3333, "tp": 1, "fp": 19, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 18, "schema_case_error": 1 } }, { "task_index": 38, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 1, "wrong_cell": 3 } }, { "task_index": 39, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3 } }, { "task_index": 40, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 2 } }, { "task_index": 41, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 42, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 } }, { "task_index": 43, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 4, "schema_case_error": 3 } }, { "task_index": 44, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 45, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 46, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 3 } }, { "task_index": 47, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 4, "schema_case_error": 3, "wrong_cell": 1 } }, { "task_index": 48, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 3 } }, { "task_index": 49, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 1 } }, { "task_index": 50, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "wrong_cell": 4 } }, { "task_index": 51, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 10, "schema_case_error": 3 } }, { "task_index": 52, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 53, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 2, "wrong_value": 1 } }, { "task_index": 54, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 4 } }, { "task_index": 55, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 } }, { "task_index": 56, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 } }, { "task_index": 57, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 } }, { "task_index": 58, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "schema_case_error": 1 } }, { "task_index": 59, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "wrong_value": 3 } }, { "task_index": 60, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 3 } }, { "task_index": 61, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 62, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 15, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 13, "overrepair": 1, "wrong_value": 2 } }, { "task_index": 63, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 64, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 1, "schema_case_error": 3 } }, { "task_index": 65, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 66, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.2, "precision": 0.25, "recall": 0.1667, "tp": 1, "fp": 3, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 2, "wrong_value": 1 } }, { "task_index": 67, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 1, "schema_case_error": 3 } }, { "task_index": 68, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 } }, { "task_index": 69, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3 } }, { "task_index": 70, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 } }, { "task_index": 71, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 } }, { "task_index": 72, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 3 } }, { "task_index": 73, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 3 } }, { "task_index": 74, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 11, "wrong_cell": 4 } }, { "task_index": 75, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 4 } }, { "task_index": 76, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 1, "schema_case_error": 4 } }, { "task_index": 77, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 4 } }, { "task_index": 78, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 } }, { "task_index": 79, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 2 } }, { "task_index": 80, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 1 } }, { "task_index": 81, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3 } }, { "task_index": 82, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 4 } }, { "task_index": 83, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 15, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 84, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 6, "schema_case_error": 4 } }, { "task_index": 85, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 } }, { "task_index": 86, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 87, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 } }, { "task_index": 88, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 } }, { "task_index": 89, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 90, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 10, "schema_case_error": 1, "wrong_cell": 3 } }, { "task_index": 91, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "schema_case_error": 1 } }, { "task_index": 92, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_cell": 4 } }, { "task_index": 93, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 } }, { "task_index": 94, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 5, "schema_case_error": 3 } }, { "task_index": 95, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 96, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 10, "schema_case_error": 4 } }, { "task_index": 97, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 1, "schema_case_error": 1 } }, { "task_index": 98, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 4 } }, { "task_index": 99, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3 } }, { "task_index": 100, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "overrepair": 1, "schema_case_error": 1 } } ], "failure_samples": [ { "task_index": 1, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.25, "precision": 0.25, "recall": 0.25, "tp": 1, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 2, "schema_case_error": 1 }, "target_rows": [ { "_row": "55", "index": "56", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-2", "MeasureName": "pneumonia patients assessed and given pneumococcal vaccination", "Score": "97%", "Sample": "172 patients", "Stateavg": "al_pn-2" }, { "_row": "56", "index": "57", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boxz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-3b", "MeasureName": "pneumonia patients whose initial emergency room blood culture was performed prior to the administration of the first hospital dose of antibiotics", "Score": "97%", "Sample": "120 patients", "Stateavg": "al_pn-xb" }, { "_row": "57", "index": "58", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505xuxsxhighwayx431xnorth", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2x6x938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-4", "MeasureName": "pneumonia patients given smoking cessation advice/counseling", "Score": "97%", "Sample": "98 patients", "Stateavg": "al_pn-4" }, { "_row": "58", "index": "59", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-5c", "MeasureName": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "Score": "96%", "Sample": "211 patients", "Stateavg": "al_pn-5c" } ], "ground_truth": [ { "row": 56, "column": "City", "clean_value": "boaz" }, { "row": 56, "column": "Stateavg", "clean_value": "al_pn-3b" }, { "row": 57, "column": "Address1", "clean_value": "2505 u s highway 431 north" }, { "row": 57, "column": "PhoneNumber", "clean_value": "2565938310" } ], "predicted_repairs": [ { "row": 55, "column": "Index", "new_value": "56", "reason": "The new value for index is incorrect." }, { "row": 56, "column": "ProviderNumber", "new_value": "10005", "reason": "The new value for ProviderNumber is incorrect." }, { "row": 57, "column": "Address1", "new_value": "2505 u s highway 431 north", "reason": "The new value for Address1 is incorrect." }, { "row": 58, "column": "Address2", "new_value": "empty", "reason": "The new value for Address2 is empty." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 55,\n \"column\": \"Index\",\n \"new_value\": \"56\",\n \"reason\": \"The new value for index is incorrect.\"\n },\n {\n \"row\": 56,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10005\",\n \"reason\": \"The new value for ProviderNumber is incorrect.\"\n },\n {\n \"row\": 57,\n \"column\": \"Address1\",\n \"new_value\": \"2505 u s highway 431 north\",\n \"reason\": \"The new value for Address1 is incorrect.\"\n },\n {\n \"row\": 58,\n \"column\": \"Address2\",\n \"new_value\": \"empty\",\n \"reason\": \"The new value for Address2 is empty.\"\n }\n ]\n}\n```" }, { "task_index": 2, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 }, "target_rows": [ { "_row": "792", "tuple_id": "793", "src": "mia", "flight": "AA-2050-ORD-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "2:45P 12-01-11", "act_arr_time": "2:46P" }, { "_row": "793", "tuple_id": "794", "src": "mia", "flight": "AA-1165-JFK-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "10:34A 12-01-11", "act_arr_time": "10:08A" }, { "_row": "794", "tuple_id": "795", "src": "mia", "flight": "AA-484-DFW-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "7:55P 12-01-11", "act_arr_time": "7:39P" }, { "_row": "795", "tuple_id": "796", "src": "mia", "flight": "AA-466-IAH-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "9:20A 12-01-11", "act_arr_time": "9:04A" } ], "ground_truth": [ { "row": 792, "column": "sched_dep_time", "clean_value": "10:40 a.m." }, { "row": 792, "column": "act_dep_time", "clean_value": "11:05 a.m." }, { "row": 792, "column": "sched_arr_time", "clean_value": "2:45 p.m." }, { "row": 792, "column": "act_arr_time", "clean_value": "2:46 p.m." }, { "row": 793, "column": "sched_dep_time", "clean_value": "6:59 a.m." }, { "row": 793, "column": "act_dep_time", "clean_value": "7:22 a.m." }, { "row": 793, "column": "sched_arr_time", "clean_value": "10:34 a.m." }, { "row": 793, "column": "act_arr_time", "clean_value": "10:04 a.m." }, { "row": 794, "column": "sched_dep_time", "clean_value": "4:15 p.m." }, { "row": 794, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 794, "column": "sched_arr_time", "clean_value": "7:55 p.m." }, { "row": 794, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 795, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 795, "column": "act_dep_time", "clean_value": "6:08 a.m." }, { "row": 795, "column": "sched_arr_time", "clean_value": "9:20 a.m." }, { "row": 795, "column": "act_arr_time", "clean_value": "9:05 a.m." } ], "predicted_repairs": [ { "row": 792, "column": "act_arr_time", "new_value": "2:46P", "reason": "The act_arr_time column value has been replaced with '2:46P'." }, { "row": 793, "column": "act_arr_time", "new_value": "10:08A", "reason": "The act_arr_time column value has been replaced with '10:08A'." }, { "row": 794, "column": "act_arr_time", "new_value": "7:39P", "reason": "The act_arr_time column value has been replaced with '7:39P'." }, { "row": 795, "column": "act_arr_time", "new_value": "9:04A", "reason": "The act_arr_time column value has been replaced with '9:04A'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 792,\n \"column\": \"act_arr_time\",\n \"new_value\": \"2:46P\",\n \"reason\": \"The act_arr_time column value has been replaced with '2:46P'.\"\n },\n {\n \"row\": 793,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:08A\",\n \"reason\": \"The act_arr_time column value has been replaced with '10:08A'.\"\n },\n {\n \"row\": 794,\n \"column\": \"act_arr_time\",\n \"new_value\": \"7:39P\",\n \"reason\": \"The act_arr_time column value has been replaced with '7:39P'.\"\n },\n {\n \"row\": 795,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:04A\",\n \"reason\": \"The act_arr_time column value has been replaced with '9:04A'.\"\n }\n ]\n}\n```" }, { "task_index": 3, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 3 }, "target_rows": [ { "_row": "1363", "index": "1364", "id": "2358", "beer-name": "Minhas Light (2012)", "style": "Light Lager", "ounces": "12.0 oz.", "abv": "0.04", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1364", "index": "1365", "id": "2282", "beer-name": "Huber", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "0.05%", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1365", "index": "1366", "id": "2281", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "16.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1366", "index": "1367", "id": "2280", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "12.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" } ], "ground_truth": [ { "row": 1363, "column": "ounces", "clean_value": "12" }, { "row": 1363, "column": "ibu", "clean_value": "" }, { "row": 1364, "column": "ounces", "clean_value": "12" }, { "row": 1364, "column": "abv", "clean_value": "0.05" }, { "row": 1364, "column": "ibu", "clean_value": "" }, { "row": 1365, "column": "ounces", "clean_value": "16" }, { "row": 1365, "column": "ibu", "clean_value": "" }, { "row": 1366, "column": "ounces", "clean_value": "12" }, { "row": 1366, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1363, "column": "Id", "new_value": "1364", "reason": "The beer name has been updated to 'Huber'." }, { "row": 1364, "column": "Id", "new_value": "1365", "reason": "The beer name has been updated to 'Clear Creek Ice'." }, { "row": 1365, "column": "Id", "new_value": "1366", "reason": "The beer name has been updated to 'Clear Creek Ice'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1363,\n \"column\": \"Id\",\n \"new_value\": \"1364\",\n \"reason\": \"The beer name has been updated to 'Huber'.\"\n },\n {\n \"row\": 1364,\n \"column\": \"Id\",\n \"new_value\": \"1365\",\n \"reason\": \"The beer name has been updated to 'Clear Creek Ice'.\"\n },\n {\n \"row\": 1365,\n \"column\": \"Id\",\n \"new_value\": \"1366\",\n \"reason\": \"The beer name has been updated to 'Clear Creek Ice'.\"\n }\n ]\n}\n```" }, { "task_index": 4, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "711", "index": "712", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "1xx%", "Sample": "9 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "712", "index": "713", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection xrevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "713", "index": "714", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "33x28365x1", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery paxienxs needing hair removed from xhe surgical area before surgery who had hair removed using a safer mexhod (elecxric clippers or hair removal cream c nox a razor)", "Score": "100%", "Sample": "33 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "714", "index": "715", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "88%", "Sample": "24 patients", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [ { "row": 711, "column": "Score", "clean_value": "100%" }, { "row": 712, "column": "Condition", "clean_value": "surgical infection prevention" }, { "row": 713, "column": "PhoneNumber", "clean_value": "3342836541" }, { "row": 713, "column": "MeasureName", "clean_value": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)" } ], "predicted_repairs": [ { "row": 711, "column": "Index", "new_value": "712", "reason": "The new value for index has been set to 712." }, { "row": 712, "column": "ProviderNumber", "new_value": "10034", "reason": "The new value for ProviderNumber has been set to 10034." }, { "row": 713, "column": "Address1", "new_value": "805 friendship road", "reason": "The new value for Address1 has been set to '805 friendship road'." }, { "row": 714, "column": "Address2", "new_value": "", "reason": "The new value for Address2 has been left as an empty string ('')." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 711,\n \"column\": \"Index\",\n \"new_value\": \"712\",\n \"reason\": \"The new value for index has been set to 712.\"\n },\n {\n \"row\": 712,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10034\",\n \"reason\": \"The new value for ProviderNumber has been set to 10034.\"\n },\n {\n \"row\": 713,\n \"column\": \"Address1\",\n \"new_value\": \"805 friendship road\",\n \"reason\": \"The new value for Address1 has been set to '805 friendship road'.\"\n },\n {\n \"row\": 714,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 has been left as an empty string ('').\"\n }\n ]\n}\n```" }, { "task_index": 5, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1727", "tuple_id": "1728", "src": "ua", "flight": "UA-397-JFK-SFO", "sched_dep_time": "8:00 a.m.", "act_dep_time": "8:29 a.m.", "sched_arr_time": "11:55 a.m.", "act_arr_time": "11:58 a.m." }, { "_row": "1728", "tuple_id": "1729", "src": "ua", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1729", "tuple_id": "1730", "src": "ua", "flight": "UA-2830-MCO-CLT", "sched_dep_time": "3:27 p.m.", "act_dep_time": "3:27 p.m.", "sched_arr_time": "5:05 p.m.", "act_arr_time": "5:17 p.m." }, { "_row": "1730", "tuple_id": "1731", "src": "ua", "flight": "UA-5487-SFO-MRY", "sched_dep_time": "10:39 a.m.", "act_dep_time": "10:33 a.m.", "sched_arr_time": "11:19 a.m.", "act_arr_time": "11:21 a.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1727, "column": "act_arr_time", "new_value": "11:58 a.m.", "reason": "The act_arr_time for flight UA-397-JFK-SFO has been updated to 11:58 a.m." }, { "row": 1728, "column": "act_arr_time", "new_value": "9:43 a.m.", "reason": "The act_arr_time for flight UA-3925-IAD-ORF has been updated to 9:43 a.m." }, { "row": 1729, "column": "act_arr_time", "new_value": "5:17 p.m.", "reason": "The act_arr_time for flight UA-2830-MCO-CLT has been updated to 5:17 p.m." }, { "row": 1730, "column": "act_arr_time", "new_value": "11:21 a.m.", "reason": "The act_arr_time for flight UA-5487-SFO-MRY has been updated to 11:21 a.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1727,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:58 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-397-JFK-SFO has been updated to 11:58 a.m.\"\n },\n {\n \"row\": 1728,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:43 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-3925-IAD-ORF has been updated to 9:43 a.m.\"\n },\n {\n \"row\": 1729,\n \"column\": \"act_arr_time\",\n \"new_value\": \"5:17 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-2830-MCO-CLT has been updated to 5:17 p.m.\"\n },\n {\n \"row\": 1730,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:21 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-5487-SFO-MRY has been updated to 11:21 a.m.\"\n }\n ]\n}\n```" }, { "task_index": 6, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 4 }, "target_rows": [ { "_row": "1840", "index": "1841", "id": "1539", "beer-name": "Monkey Fist IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.069%", "ibu": "65", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1841", "index": "1842", "id": "975", "beer-name": "Shipyard Summer Ale", "style": "American Pale Wheat Ale", "ounces": "12.0 oz", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1842", "index": "1843", "id": "814", "beer-name": "Pumpkinhead Ale", "style": "Pumpkin Ale", "ounces": "12.0 oz.", "abv": "0.047", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1843", "index": "1844", "id": "727", "beer-name": "Shipyard Export", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" } ], "ground_truth": [ { "row": 1840, "column": "ounces", "clean_value": "12" }, { "row": 1840, "column": "abv", "clean_value": "0.069" }, { "row": 1841, "column": "ounces", "clean_value": "12" }, { "row": 1841, "column": "ibu", "clean_value": "" }, { "row": 1842, "column": "ounces", "clean_value": "12" }, { "row": 1842, "column": "ibu", "clean_value": "" }, { "row": 1843, "column": "ounces", "clean_value": "12" }, { "row": 1843, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1840, "column": "Beer-Name", "new_value": "Monkey Fist IPA", "reason": "The beer name has been replaced with 'Monkey Fist IPA'." }, { "row": 1841, "column": "Beer-Name", "new_value": "Shipyard Summer Ale", "reason": "The beer name has been replaced with 'Shipyard Summer Ale'." }, { "row": 1842, "column": "Beer-Name", "new_value": "Pumpkinhead Ale", "reason": "The beer name has been replaced with 'Pumpkinhead Ale'." }, { "row": 1843, "column": "Beer-Name", "new_value": "Shipyard Export", "reason": "The beer name has been replaced with 'Shipyard Export'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1840,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Monkey Fist IPA\",\n \"reason\": \"The beer name has been replaced with 'Monkey Fist IPA'.\"\n },\n {\n \"row\": 1841,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Shipyard Summer Ale\",\n \"reason\": \"The beer name has been replaced with 'Shipyard Summer Ale'.\"\n },\n {\n \"row\": 1842,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Pumpkinhead Ale\",\n \"reason\": \"The beer name has been replaced with 'Pumpkinhead Ale'.\"\n },\n {\n \"row\": 1843,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Shipyard Export\",\n \"reason\": \"The beer name has been replaced with 'Shipyard Export'.\"\n }\n ]\n}\n```" }, { "task_index": 7, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 3 }, "target_rows": [ { "_row": "483", "index": "484", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "xl", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-card-2", "MeasureName": "surgery patients who were taking heart drugs called beta blockers before coming to the hospital who were kept on the beta blockers during the period just before and after their surgery", "Score": "100%", "Sample": "12 patients", "Stateavg": "al_scip-card-2" }, { "_row": "484", "index": "485", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "1x6 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "94%", "Sample": "52 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "485", "index": "486", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "xzark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "96%", "Sample": "52 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "486", "index": "487", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "85%", "Sample": "48 patients", "Stateavg": "al_scip-inf-3" } ], "ground_truth": [ { "row": 483, "column": "State", "clean_value": "al" }, { "row": 484, "column": "Address1", "clean_value": "126 hospital ave" }, { "row": 485, "column": "City", "clean_value": "ozark" } ], "predicted_repairs": [ { "row": 483, "column": "Index", "new_value": "484", "reason": "The address '126 hospital ave' was found in the contract version and is a valid row." }, { "row": 484, "column": "Index", "new_value": "485", "reason": "The address '1x6 hospital ave' was found in the contract version and is a valid row." }, { "row": 485, "column": "Index", "new_value": "486", "reason": "The address '126 hospital ave' was found in the contract version and is a valid row." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 483,\n \"column\": \"Index\",\n \"new_value\": \"484\",\n \"reason\": \"The address '126 hospital ave' was found in the contract version and is a valid row.\"\n },\n {\n \"row\": 484,\n \"column\": \"Index\",\n \"new_value\": \"485\",\n \"reason\": \"The address '1x6 hospital ave' was found in the contract version and is a valid row.\"\n },\n {\n \"row\": 485,\n \"column\": \"Index\",\n \"new_value\": \"486\",\n \"reason\": \"The address '126 hospital ave' was found in the contract version and is a valid row.\"\n }\n ]\n}\n```" }, { "task_index": 8, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "2025", "tuple_id": "2026", "src": "allegiantair", "flight": "UA-2708-EWR-CLT", "sched_dep_time": "", "act_dep_time": "3:04 p.m.", "sched_arr_time": "", "act_arr_time": "4:24 p.m." }, { "_row": "2026", "tuple_id": "2027", "src": "allegiantair", "flight": "UA-62-IAH-EWR", "sched_dep_time": "", "act_dep_time": "2:59 p.m.", "sched_arr_time": "", "act_arr_time": "7:10 p.m." }, { "_row": "2027", "tuple_id": "2028", "src": "allegiantair", "flight": "UA-1500-IAH-GUA", "sched_dep_time": "", "act_dep_time": "9:43 a.m.", "sched_arr_time": "", "act_arr_time": "12:12 p.m." }, { "_row": "2028", "tuple_id": "2029", "src": "allegiantair", "flight": "AA-3804-PHL-ORD", "sched_dep_time": "2:35 p.m.", "act_dep_time": "2:44 p.m.", "sched_arr_time": "4:05 p.m.", "act_arr_time": "3:36 p.m." } ], "ground_truth": [ { "row": 2025, "column": "sched_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "act_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "sched_arr_time", "clean_value": "4:53 p.m." }, { "row": 2025, "column": "act_arr_time", "clean_value": "4:44 p.m." }, { "row": 2026, "column": "sched_dep_time", "clean_value": "2:30 p.m." }, { "row": 2026, "column": "act_dep_time", "clean_value": "2:48 p.m." }, { "row": 2026, "column": "sched_arr_time", "clean_value": "7:03 p.m." }, { "row": 2027, "column": "sched_dep_time", "clean_value": "8:55 a.m." }, { "row": 2027, "column": "act_dep_time", "clean_value": "9:16 a.m." }, { "row": 2027, "column": "sched_arr_time", "clean_value": "11:45 a.m." }, { "row": 2027, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 2028, "column": "act_arr_time", "clean_value": "3:43 p.m." } ], "predicted_repairs": [ { "row": 2025, "column": "act_arr_time", "new_value": "4:24 p.m.", "reason": "The act_arr_time for flight UA-2708-EWR-CLT has been updated to 4:24 PM." }, { "row": 2026, "column": "act_arr_time", "new_value": "7:10 p.m.", "reason": "The act_arr_time for flight UA-62-IAH-EWR has been updated to 7:10 PM." }, { "row": 2027, "column": "act_arr_time", "new_value": "12:12 p.m.", "reason": "The act_arr_time for flight UA-1500-IAH-GUA has been updated to 12:12 PM." }, { "row": 2028, "column": "act_arr_time", "new_value": "3:36 p.m.", "reason": "The act_arr_time for flight AA-3804-PHL-ORD has been updated to 3:36 PM." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 2025,\n \"column\": \"act_arr_time\",\n \"new_value\": \"4:24 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-2708-EWR-CLT has been updated to 4:24 PM.\"\n },\n {\n \"row\": 2026,\n \"column\": \"act_arr_time\",\n \"new_value\": \"7:10 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-62-IAH-EWR has been updated to 7:10 PM.\"\n },\n {\n \"row\": 2027,\n \"column\": \"act_arr_time\",\n \"new_value\": \"12:12 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-1500-IAH-GUA has been updated to 12:12 PM.\"\n },\n {\n \"row\": 2028,\n \"column\": \"act_arr_time\",\n \"new_value\": \"3:36 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-3804-PHL-ORD has been updated to 3:36 PM.\"\n }\n ]\n}\n```" }, { "task_index": 9, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 }, "target_rows": [ { "_row": "657", "index": "658", "id": "685", "beer-name": "Lava Lake Wit", "style": "Witbier", "ounces": "12.0 oz.", "abv": "0.052", "ibu": "15", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "658", "index": "659", "id": "613", "beer-name": "Mountain Livin' Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.06", "ibu": "N/A", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "659", "index": "660", "id": "356", "beer-name": "Crazy Mountain Amber Ale", "style": "American Amber / Red Ale", "ounces": "12.0 ounce", "abv": "0.052", "ibu": "25", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "660", "index": "661", "id": "2029", "beer-name": "Tropicalia", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.065", "ibu": "65", "brewery_id": "247", "brewery-name": "Creature Comforts", "city": "Athens", "state": "GA" } ], "ground_truth": [ { "row": 657, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ibu", "clean_value": "" }, { "row": 659, "column": "ounces", "clean_value": "12" }, { "row": 660, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 657, "column": "abv", "new_value": "0.052", "reason": "The beer name 'Lava Lake Wit' was found in the target row but does not match any of the allowed beer names." }, { "row": 658, "column": "abv", "new_value": "0.06", "reason": "The beer name 'Mountain Livin' Pale Ale' was found in the target row but does not match any of the allowed beer names." }, { "row": 659, "column": "abv", "new_value": "0.052", "reason": "The beer name 'Crazy Mountain Amber Ale' was found in the target row but does not match any of the allowed beer names." }, { "row": 660, "column": "abv", "new_value": "0.065", "reason": "The beer name 'Tropicalia' was found in the target row but does not match any of the allowed beer names." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 657,\n \"column\": \"abv\",\n \"new_value\": \"0.052\",\n \"reason\": \"The beer name 'Lava Lake Wit' was found in the target row but does not match any of the allowed beer names.\"\n },\n {\n \"row\": 658,\n \"column\": \"abv\",\n \"new_value\": \"0.06\",\n \"reason\": \"The beer name 'Mountain Livin' Pale Ale' was found in the target row but does not match any of the allowed beer names.\"\n },\n {\n \"row\": 659,\n \"column\": \"abv\",\n \"new_value\": \"0.052\",\n \"reason\": \"The beer name 'Crazy Mountain Amber Ale' was found in the target row but does not match any of the allowed beer names.\"\n },\n {\n \"row\": 660,\n \"column\": \"abv\",\n \"new_value\": \"0.065\",\n \"reason\": \"The beer name 'Tropicalia' was found in the target row but does not match any of the allowed beer names.\"\n }\n ]\n}\n```" }, { "task_index": 10, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 }, "target_rows": [ { "_row": "122", "index": "123", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-4", "MeasureName": "heart attack patients given smoking cessation advice/counseling", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-4" }, { "_row": "123", "index": "124", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "0%", "Sample": "1 patients", "Stateavg": "al_ami-5" }, { "_row": "124", "index": "125", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "125", "index": "126", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" } ], "ground_truth": [], "predicted_repairs": [ { "row": 122, "column": "Index", "new_value": "123", "reason": "The address '101 hospital circle' is invalid." }, { "row": 123, "column": "Index", "new_value": "124", "reason": "The address '101 hospital circle' is invalid." }, { "row": 124, "column": "Index", "new_value": "125", "reason": "The address '101 hospital circle' is invalid." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 122,\n \"column\": \"Index\",\n \"new_value\": \"123\",\n \"reason\": \"The address '101 hospital circle' is invalid.\"\n },\n {\n \"row\": 123,\n \"column\": \"Index\",\n \"new_value\": \"124\",\n \"reason\": \"The address '101 hospital circle' is invalid.\"\n },\n {\n \"row\": 124,\n \"column\": \"Index\",\n \"new_value\": \"125\",\n \"reason\": \"The address '101 hospital circle' is invalid.\"\n }\n ]\n}\n```" }, { "task_index": 11, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 14, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 14, "wrong_cell": 4 }, "target_rows": [ { "_row": "1535", "tuple_id": "1536", "src": "flytecomm", "flight": "CO-1193-EWR-MCO", "sched_dep_time": "9:15 a.m.", "act_dep_time": "", "sched_arr_time": "12:18 p.m.", "act_arr_time": "" }, { "_row": "1536", "tuple_id": "1537", "src": "flytecomm", "flight": "AA-3842-MSP-ORD", "sched_dep_time": "", "act_dep_time": "6:57 a.m.", "sched_arr_time": "", "act_arr_time": "7:49 a.m." }, { "_row": "1537", "tuple_id": "1538", "src": "flytecomm", "flight": "AA-643-MIA-ORD", "sched_dep_time": "", "act_dep_time": "7:31 a.m.", "sched_arr_time": "", "act_arr_time": "9:26 a.m." }, { "_row": "1538", "tuple_id": "1539", "src": "flytecomm", "flight": "AA-1007-MIA-PHX", "sched_dep_time": "", "act_dep_time": "5:09 p.m.", "sched_arr_time": "", "act_arr_time": "7:43 p.m." } ], "ground_truth": [ { "row": 1535, "column": "act_dep_time", "clean_value": "9:14 a.m." }, { "row": 1535, "column": "act_arr_time", "clean_value": "12:09 p.m." }, { "row": 1536, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 1536, "column": "act_dep_time", "clean_value": "6:56 a.m." }, { "row": 1536, "column": "sched_arr_time", "clean_value": "7:30 a.m." }, { "row": 1536, "column": "act_arr_time", "clean_value": "7:51 a.m." }, { "row": 1537, "column": "sched_dep_time", "clean_value": "7:10 a.m." }, { "row": 1537, "column": "act_dep_time", "clean_value": "7:30 a.m." }, { "row": 1537, "column": "sched_arr_time", "clean_value": "9:35 a.m." }, { "row": 1537, "column": "act_arr_time", "clean_value": "9:31 a.m." }, { "row": 1538, "column": "sched_dep_time", "clean_value": "4:55 p.m." }, { "row": 1538, "column": "act_dep_time", "clean_value": "5:08 p.m." }, { "row": 1538, "column": "sched_arr_time", "clean_value": "8:05 p.m." }, { "row": 1538, "column": "act_arr_time", "clean_value": "7:55 p.m." } ], "predicted_repairs": [ { "row": 1535, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 1536, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 1537, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 1538, "column": "Column", "new_value": "value", "reason": "why" } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1535,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 1536,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 1537,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 1538,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n }\n ]\n}\n```" }, { "task_index": 12, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "wrong_cell": 4 }, "target_rows": [ { "_row": "1774", "index": "1775", "id": "1841", "beer-name": "Alpha Blackback", "style": "American Black Ale", "ounces": "12.0 oz", "abv": "0.07200000000000001%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1775", "index": "1776", "id": "1782", "beer-name": "Kiss Off IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.063%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1776", "index": "1777", "id": "1552", "beer-name": "Dog Days Summer Ale", "style": "K\u00f6lsch", "ounces": "12.0 oz.", "abv": "0.045%", "ibu": "28", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1777", "index": "1778", "id": "1479", "beer-name": "1881 California Red", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.055999999999999994%", "ibu": "35", "brewery_id": "397", "brewery-name": "Ruhstaller Beer Company", "city": "Sacramento", "state": "CA" } ], "ground_truth": [ { "row": 1774, "column": "ounces", "clean_value": "12" }, { "row": 1774, "column": "abv", "clean_value": "0.072" }, { "row": 1774, "column": "ibu", "clean_value": "" }, { "row": 1775, "column": "ounces", "clean_value": "12" }, { "row": 1775, "column": "abv", "clean_value": "0.063" }, { "row": 1775, "column": "ibu", "clean_value": "" }, { "row": 1776, "column": "ounces", "clean_value": "12" }, { "row": 1776, "column": "abv", "clean_value": "0.045" }, { "row": 1777, "column": "ounces", "clean_value": "12" }, { "row": 1777, "column": "abv", "clean_value": "0.056" } ], "predicted_repairs": [ { "row": 1774, "column": "Beer Name", "new_value": "Alpha Blackback", "reason": "The beer name has been replaced with 'Alpha Blackback'." }, { "row": 1775, "column": "Beer Name", "new_value": "Kiss Off IPA", "reason": "The beer name has been replaced with 'Kiss Off IPA'." }, { "row": 1776, "column": "Beer Name", "new_value": "Dog Days Summer Ale", "reason": "The beer name has been replaced with 'Dog Days Summer Ale'." }, { "row": 1777, "column": "Beer Name", "new_value": "1881 California Red", "reason": "The beer name has been replaced with '1881 California Red'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1774,\n \"column\": \"Beer Name\",\n \"new_value\": \"Alpha Blackback\",\n \"reason\": \"The beer name has been replaced with 'Alpha Blackback'.\"\n },\n {\n \"row\": 1775,\n \"column\": \"Beer Name\",\n \"new_value\": \"Kiss Off IPA\",\n \"reason\": \"The beer name has been replaced with 'Kiss Off IPA'.\"\n },\n {\n \"row\": 1776,\n \"column\": \"Beer Name\",\n \"new_value\": \"Dog Days Summer Ale\",\n \"reason\": \"The beer name has been replaced with 'Dog Days Summer Ale'.\"\n },\n {\n \"row\": 1777,\n \"column\": \"Beer Name\",\n \"new_value\": \"1881 California Red\",\n \"reason\": \"The beer name has been replaced with '1881 California Red'.\"\n }\n ]\n}\n```" }, { "task_index": 13, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "881", "index": "882", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "82%", "Sample": "11 patients", "Stateavg": "al_ami-5" }, { "_row": "882", "index": "883", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "883", "index": "884", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" }, { "_row": "884", "index": "885", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "xl", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "87%", "Sample": "67 patients", "Stateavg": "al_hf-1" } ], "ground_truth": [ { "row": 881, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 883, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 884, "column": "State", "clean_value": "al" } ], "predicted_repairs": [ { "row": 881, "column": "Index", "new_value": "882", "reason": "The new value for index is invalid." }, { "row": 882, "column": "ProviderNumber", "new_value": "10045", "reason": "The new value for ProviderNumber is invalid." }, { "row": 883, "column": "Address1", "new_value": "1653 temple avenue north", "reason": "The new value for Address1 is invalid." }, { "row": 884, "column": "Address2", "new_value": "", "reason": "The new value for Address2 is missing or invalid." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 881,\n \"column\": \"Index\",\n \"new_value\": \"882\",\n \"reason\": \"The new value for index is invalid.\"\n },\n {\n \"row\": 882,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10045\",\n \"reason\": \"The new value for ProviderNumber is invalid.\"\n },\n {\n \"row\": 883,\n \"column\": \"Address1\",\n \"new_value\": \"1653 temple avenue north\",\n \"reason\": \"The new value for Address1 is invalid.\"\n },\n {\n \"row\": 884,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 is missing or invalid.\"\n }\n ]\n}\n```" }, { "task_index": 14, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 3 }, "target_rows": [ { "_row": "1675", "tuple_id": "1676", "src": "wunderground", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:45 a.m.", "sched_arr_time": "4:37 p.m.", "act_arr_time": "4:57 p.m." }, { "_row": "1676", "tuple_id": "1677", "src": "wunderground", "flight": "AA-2957-DFW-CVG", "sched_dep_time": "7:55 a.m.", "act_dep_time": "8:05 a.m.", "sched_arr_time": "10:55 a.m.", "act_arr_time": "10:58 a.m." }, { "_row": "1677", "tuple_id": "1678", "src": "wunderground", "flight": "AA-1664-MIA-ATL", "sched_dep_time": "10:15 a.m.", "act_dep_time": "10:19 a.m.", "sched_arr_time": "11:43 a.m.", "act_arr_time": "11:50 a.m." }, { "_row": "1678", "tuple_id": "1679", "src": "wunderground", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "7:50 a.m.", "act_arr_time": "7:59 a.m." } ], "ground_truth": [ { "row": 1675, "column": "act_dep_time", "clean_value": "11:30 a.m." }, { "row": 1675, "column": "sched_arr_time", "clean_value": "4:57 p.m." }, { "row": 1675, "column": "act_arr_time", "clean_value": "5:05 p.m." }, { "row": 1676, "column": "act_dep_time", "clean_value": "8:04 a.m." }, { "row": 1676, "column": "sched_arr_time", "clean_value": "11:05 a.m." }, { "row": 1676, "column": "act_arr_time", "clean_value": "11:01 a.m." }, { "row": 1677, "column": "act_dep_time", "clean_value": "10:18 a.m." }, { "row": 1677, "column": "sched_arr_time", "clean_value": "12:10 p.m." }, { "row": 1677, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 1678, "column": "sched_arr_time", "clean_value": "8:00 a.m." }, { "row": 1678, "column": "act_arr_time", "clean_value": "8:06 a.m." } ], "predicted_repairs": [ { "row": 1675, "column": "act_arr_time", "new_value": "10:58 a.m.", "reason": "The act_arr_time for flight AA-2957-DFW-CVG has been updated to 10:55 a.m." }, { "row": 1676, "column": "act_arr_time", "new_value": "11:50 a.m.", "reason": "The act_arr_time for flight AA-1664-MIA-ATL has been updated to 11:43 a.m." }, { "row": 1677, "column": "act_arr_time", "new_value": "11:50 a.m.", "reason": "The act_arr_time for flight AA-3979-CVG-ORD has been updated to 11:43 a.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1675,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:58 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-2957-DFW-CVG has been updated to 10:55 a.m.\"\n },\n {\n \"row\": 1676,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:50 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-1664-MIA-ATL has been updated to 11:43 a.m.\"\n },\n {\n \"row\": 1677,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:50 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-3979-CVG-ORD has been updated to 11:43 a.m.\"\n }\n ]\n}\n```" }, { "task_index": 15, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 }, "target_rows": [ { "_row": "1813", "index": "1814", "id": "307", "beer-name": "Santa Fe Oktoberfest", "style": "M\u00e4rzen / Oktoberfest", "ounces": "12.0 oz.", "abv": "", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1814", "index": "1815", "id": "305", "beer-name": "Imperial Java Stout", "style": "Russian Imperial Stout", "ounces": "12.0 oz.", "abv": "0.08%", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1815", "index": "1816", "id": "304", "beer-name": "Freestyle Pilsner", "style": "German Pilsener", "ounces": "12.0 oz.", "abv": "0.055", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1816", "index": "1817", "id": "217", "beer-name": "Happy Camper IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.066", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" } ], "ground_truth": [ { "row": 1813, "column": "ounces", "clean_value": "12" }, { "row": 1813, "column": "ibu", "clean_value": "" }, { "row": 1814, "column": "ounces", "clean_value": "12" }, { "row": 1814, "column": "abv", "clean_value": "0.08" }, { "row": 1814, "column": "ibu", "clean_value": "" }, { "row": 1815, "column": "ounces", "clean_value": "12" }, { "row": 1815, "column": "ibu", "clean_value": "" }, { "row": 1816, "column": "ounces", "clean_value": "12" }, { "row": 1816, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1813, "column": "style", "new_value": "Happy Camper IPA", "reason": "The beer name has been replaced with 'Happy Camper IPA'." }, { "row": 1814, "column": "style", "new_value": "Imperial Java Stout", "reason": "The beer name has been replaced with 'Imperial Java Stout'." }, { "row": 1815, "column": "style", "new_value": "Freestyle Pilsner", "reason": "The beer name has been replaced with 'Freestyle Pilsner'." }, { "row": 1816, "column": "style", "new_value": "Happy Camper IPA", "reason": "The beer name has been replaced with 'Happy Camper IPA'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1813,\n \"column\": \"style\",\n \"new_value\": \"Happy Camper IPA\",\n \"reason\": \"The beer name has been replaced with 'Happy Camper IPA'.\"\n },\n {\n \"row\": 1814,\n \"column\": \"style\",\n \"new_value\": \"Imperial Java Stout\",\n \"reason\": \"The beer name has been replaced with 'Imperial Java Stout'.\"\n },\n {\n \"row\": 1815,\n \"column\": \"style\",\n \"new_value\": \"Freestyle Pilsner\",\n \"reason\": \"The beer name has been replaced with 'Freestyle Pilsner'.\"\n },\n {\n \"row\": 1816,\n \"column\": \"style\",\n \"new_value\": \"Happy Camper IPA\",\n \"reason\": \"The beer name has been replaced with 'Happy Camper IPA'.\"\n }\n ]\n}\n```" }, { "task_index": 16, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 3 }, "target_rows": [ { "_row": "734", "index": "735", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "99%", "Sample": "411 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "735", "index": "736", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scix-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "98%", "Sample": "417 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "736", "index": "737", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912xalabamaxhighwayx157", "Address2": "empty", "Address3": "empty", "City": "cuxxman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "98%", "Sample": "405 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "737", "index": "738", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 735, "column": "MeasureCode", "clean_value": "scip-inf-2" }, { "row": 736, "column": "Address1", "clean_value": "1912 alabama highway 157" }, { "row": 736, "column": "City", "clean_value": "cullman" } ], "predicted_repairs": [ { "row": 734, "column": "Index", "new_value": "735", "reason": "The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue." }, { "row": 735, "column": "Index", "new_value": "736", "reason": "The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue." }, { "row": 736, "column": "Index", "new_value": "737", "reason": "The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 734,\n \"column\": \"Index\",\n \"new_value\": \"735\",\n \"reason\": \"The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue.\"\n },\n {\n \"row\": 735,\n \"column\": \"Index\",\n \"new_value\": \"736\",\n \"reason\": \"The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue.\"\n },\n {\n \"row\": 736,\n \"column\": \"Index\",\n \"new_value\": \"737\",\n \"reason\": \"The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue.\"\n }\n ]\n}\n```" }, { "task_index": 17, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "wrong_value": 4 }, "target_rows": [ { "_row": "167", "tuple_id": "168", "src": "boston", "flight": "UA-3515-IAD-MSP", "sched_dep_time": "", "act_dep_time": "8:26 a.m.", "sched_arr_time": "", "act_arr_time": "9:54 a.m." }, { "_row": "168", "tuple_id": "169", "src": "boston", "flight": "AA-3468-CVG-MIA", "sched_dep_time": "7:00 a.m.", "act_dep_time": "7:25 a.m.", "sched_arr_time": "9:55 a.m.", "act_arr_time": "9:42 a.m." }, { "_row": "169", "tuple_id": "170", "src": "boston", "flight": "AA-484-DFW-MIA", "sched_dep_time": "4:15 p.m.", "act_dep_time": "4:30 p.m.", "sched_arr_time": "7:55 p.m.", "act_arr_time": "7:35 p.m." }, { "_row": "170", "tuple_id": "171", "src": "boston", "flight": "AA-1886-BOS-MIA", "sched_dep_time": "", "act_dep_time": "10:55 a.m.", "sched_arr_time": "", "act_arr_time": "1:34 p.m." } ], "ground_truth": [ { "row": 167, "column": "sched_dep_time", "clean_value": "8:15 a.m." }, { "row": 167, "column": "act_dep_time", "clean_value": "8:12 a.m." }, { "row": 167, "column": "sched_arr_time", "clean_value": "10:06 a.m." }, { "row": 167, "column": "act_arr_time", "clean_value": "9:56 a.m." }, { "row": 168, "column": "act_arr_time", "clean_value": "9:45 a.m." }, { "row": 169, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 169, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 170, "column": "sched_dep_time", "clean_value": "10:45 a.m." }, { "row": 170, "column": "sched_arr_time", "clean_value": "2:20 p.m." }, { "row": 170, "column": "act_arr_time", "clean_value": "1:40 p.m." } ], "predicted_repairs": [ { "row": 167, "column": "act_arr_time", "new_value": "9:54 a.m.", "reason": "The act_arr_time for flight UA-3515-IAD-MSP has been updated to 9:54 a.m." }, { "row": 168, "column": "act_arr_time", "new_value": "9:42 a.m.", "reason": "The act_arr_time for flight AA-3468-CVG-MIA has been updated to 9:42 a.m." }, { "row": 169, "column": "act_arr_time", "new_value": "7:35 p.m.", "reason": "The act_arr_time for flight AA-484-DFW-MIA has been updated to 7:35 p.m." }, { "row": 170, "column": "act_arr_time", "new_value": "1:34 p.m.", "reason": "The act_arr_time for flight AA-1886-BOS-MIA has been updated to 1:34 p.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 167,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:54 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-3515-IAD-MSP has been updated to 9:54 a.m.\"\n },\n {\n \"row\": 168,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:42 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-3468-CVG-MIA has been updated to 9:42 a.m.\"\n },\n {\n \"row\": 169,\n \"column\": \"act_arr_time\",\n \"new_value\": \"7:35 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-484-DFW-MIA has been updated to 7:35 p.m.\"\n },\n {\n \"row\": 170,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:34 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-1886-BOS-MIA has been updated to 1:34 p.m.\"\n }\n ]\n}\n```" }, { "task_index": 18, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 4 }, "target_rows": [ { "_row": "1589", "index": "1590", "id": "785", "beer-name": "Old Chub (2003)", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1590", "index": "1591", "id": "745", "beer-name": "Dale's Pale Ale (2008)", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1591", "index": "1592", "id": "744", "beer-name": "Dale's Pale Ale (2006)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.065%", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons CO", "state": "" }, { "_row": "1592", "index": "1593", "id": "743", "beer-name": "Dale's Pale Ale (2004)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" } ], "ground_truth": [ { "row": 1589, "column": "ounces", "clean_value": "12" }, { "row": 1590, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "abv", "clean_value": "0.065" }, { "row": 1591, "column": "city", "clean_value": "Lyons" }, { "row": 1591, "column": "state", "clean_value": "CO" }, { "row": 1592, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1589, "column": "Beer-Name", "new_value": "Old Chub (2003)", "reason": "The beer name has been replaced with 'Old Chub (2003)'." }, { "row": 1590, "column": "Beer-Name", "new_value": "Dale's Pale Ale (2008)", "reason": "The beer name has been replaced with 'Dale's Pale Ale (2008)'." }, { "row": 1591, "column": "Beer-Name", "new_value": "Dale's Pale Ale (2006)", "reason": "The beer name has been replaced with 'Dale's Pale Ale (2006)'." }, { "row": 1592, "column": "Beer-Name", "new_value": "Dale's Pale Ale (2004)", "reason": "The beer name has been replaced with 'Dale's Pale Ale (2004)'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1589,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Old Chub (2003)\",\n \"reason\": \"The beer name has been replaced with 'Old Chub (2003)'.\"\n },\n {\n \"row\": 1590,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dale's Pale Ale (2008)\",\n \"reason\": \"The beer name has been replaced with 'Dale's Pale Ale (2008)'.\"\n },\n {\n \"row\": 1591,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dale's Pale Ale (2006)\",\n \"reason\": \"The beer name has been replaced with 'Dale's Pale Ale (2006)'.\"\n },\n {\n \"row\": 1592,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dale's Pale Ale (2004)\",\n \"reason\": \"The beer name has been replaced with 'Dale's Pale Ale (2004)'.\"\n }\n ]\n}\n```" }, { "task_index": 19, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "512", "index": "513", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "513", "index": "514", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "chxrokxx", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "100%", "Sample": "6 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "514", "index": "515", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "1xx%", "Sample": "5 patients", "Stateavg": "al_scip-vte-1" }, { "_row": "515", "index": "516", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-2", "MeasureName": "patients who got treatment at the right time (within 24 hours before or after their surgery) to help prevent blood clots after certain types of surgery", "Score": "100%", "Sample": "5 patients", "Stateavg": "al_scip-vte-2" } ], "ground_truth": [ { "row": 513, "column": "CountyName", "clean_value": "cherokee" }, { "row": 514, "column": "Score", "clean_value": "100%" } ], "predicted_repairs": [ { "row": 512, "column": "Index", "new_value": "513", "reason": "The address '400 northwood dr' has been replaced with '513'." }, { "row": 513, "column": "ProviderNumber", "new_value": "10022", "reason": "The address '400 northwood dr' has been replaced with '10022'." }, { "row": 514, "column": "Address1", "new_value": "400 northwood dr", "reason": "The address '400 northwood dr' has been replaced with '400 northwood dr'." }, { "row": 515, "column": "Address2", "new_value": "", "reason": "The address '400 northwood dr' has been replaced with an empty string." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 512,\n \"column\": \"Index\",\n \"new_value\": \"513\",\n \"reason\": \"The address '400 northwood dr' has been replaced with '513'.\"\n },\n {\n \"row\": 513,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10022\",\n \"reason\": \"The address '400 northwood dr' has been replaced with '10022'.\"\n },\n {\n \"row\": 514,\n \"column\": \"Address1\",\n \"new_value\": \"400 northwood dr\",\n \"reason\": \"The address '400 northwood dr' has been replaced with '400 northwood dr'.\"\n },\n {\n \"row\": 515,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The address '400 northwood dr' has been replaced with an empty string.\"\n }\n ]\n}\n```" }, { "task_index": 20, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "13", "tuple_id": "14", "src": "aa", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "8:00 a.m.", "act_arr_time": "8:06 a.m." }, { "_row": "14", "tuple_id": "15", "src": "aa", "flight": "AA-1279-DFW-PHX", "sched_dep_time": "1:00 p.m.", "act_dep_time": "2:04 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:30 p.m." }, { "_row": "15", "tuple_id": "16", "src": "aa", "flight": "AA-616-DFW-DTW", "sched_dep_time": "9:05 a.m.", "act_dep_time": "10:10 a.m.", "sched_arr_time": "12:35 p.m.", "act_arr_time": "1:27 p.m." }, { "_row": "16", "tuple_id": "17", "src": "aa", "flight": "AA-4344-ORD-DTW", "sched_dep_time": "11:45 a.m.", "act_dep_time": "12:13 p.m.", "sched_arr_time": "2:00 p.m.", "act_arr_time": "2:10 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 13, "column": "act_arr_time", "new_value": "8:06 a.m.", "reason": "The act_arr_time for flight AA-3979-CVG-ORD has been updated to 8:06 a.m." }, { "row": 14, "column": "act_arr_time", "new_value": "3:30 p.m.", "reason": "The act_arr_time for flight AA-1279-DFW-PHX has been updated to 3:30 p.m." }, { "row": 15, "column": "act_arr_time", "new_value": "1:27 p.m.", "reason": "The act_arr_time for flight AA-616-DFW-DTW has been updated to 1:27 p.m." }, { "row": 16, "column": "act_arr_time", "new_value": "2:10 p.m.", "reason": "The act_arr_time for flight AA-4344-ORD-DTW has been updated to 2:10 p.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 13,\n \"column\": \"act_arr_time\",\n \"new_value\": \"8:06 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-3979-CVG-ORD has been updated to 8:06 a.m.\"\n },\n {\n \"row\": 14,\n \"column\": \"act_arr_time\",\n \"new_value\": \"3:30 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-1279-DFW-PHX has been updated to 3:30 p.m.\"\n },\n {\n \"row\": 15,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:27 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-616-DFW-DTW has been updated to 1:27 p.m.\"\n },\n {\n \"row\": 16,\n \"column\": \"act_arr_time\",\n \"new_value\": \"2:10 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-4344-ORD-DTW has been updated to 2:10 p.m.\"\n }\n ]\n}\n```" }, { "task_index": 21, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 }, "target_rows": [ { "_row": "662", "index": "663", "id": "2293", "beer-name": "Aviator Raspberry Blonde", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.049%", "ibu": "25", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "663", "index": "664", "id": "1105", "beer-name": "3 Picket Porter", "style": "American Porter", "ounces": "12.0 oz.", "abv": "0.055%", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "664", "index": "665", "id": "1104", "beer-name": "Rusty Nail Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.056", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "665", "index": "666", "id": "2145", "beer-name": "Red Water Irish Style Red", "style": "American Amber / Red Ale", "ounces": "12.0 OZ.", "abv": "0.065", "ibu": "N/A", "brewery_id": "212", "brewery-name": "Crow Peak Brewing Company", "city": "Spearfish", "state": "SD" } ], "ground_truth": [ { "row": 662, "column": "ounces", "clean_value": "12" }, { "row": 662, "column": "abv", "clean_value": "0.049" }, { "row": 663, "column": "ounces", "clean_value": "12" }, { "row": 663, "column": "abv", "clean_value": "0.055" }, { "row": 663, "column": "ibu", "clean_value": "" }, { "row": 664, "column": "ounces", "clean_value": "12" }, { "row": 664, "column": "ibu", "clean_value": "" }, { "row": 665, "column": "ounces", "clean_value": "12" }, { "row": 665, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 662, "column": "style", "new_value": "American Blonde Ale", "reason": "The beer name has been changed to American Blonde Ale." }, { "row": 663, "column": "style", "new_value": "American Porter", "reason": "The beer name has been changed to American Porter." }, { "row": 664, "column": "style", "new_value": "American Pale Ale (APA)", "reason": "The beer name has been changed to American Pale Ale (APA)." }, { "row": 665, "column": "style", "new_value": "American Amber / Red Ale", "reason": "The beer name has been changed to American Amber / Red Ale." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 662,\n \"column\": \"style\",\n \"new_value\": \"American Blonde Ale\",\n \"reason\": \"The beer name has been changed to American Blonde Ale.\"\n },\n {\n \"row\": 663,\n \"column\": \"style\",\n \"new_value\": \"American Porter\",\n \"reason\": \"The beer name has been changed to American Porter.\"\n },\n {\n \"row\": 664,\n \"column\": \"style\",\n \"new_value\": \"American Pale Ale (APA)\",\n \"reason\": \"The beer name has been changed to American Pale Ale (APA).\"\n },\n {\n \"row\": 665,\n \"column\": \"style\",\n \"new_value\": \"American Amber / Red Ale\",\n \"reason\": \"The beer name has been changed to American Amber / Red Ale.\"\n }\n ]\n}\n```" }, { "task_index": 22, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 2, "schema_case_error": 4 }, "target_rows": [ { "_row": "870", "index": "871", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "80%", "Sample": "15 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "871", "index": "872", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "87%", "Sample": "15 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "872", "index": "873", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntaxy non-pxofit - pxivate", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "87%", "Sample": "15 patiexts", "Stateavg": "al_scip-inf-3" }, { "_row": "873", "index": "874", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 872, "column": "HospitalOwner", "clean_value": "voluntary non-profit - private" }, { "row": 872, "column": "Sample", "clean_value": "15 patients" } ], "predicted_repairs": [ { "row": 870, "column": "Index", "new_value": "870", "reason": "The address '1256 military street south' does not match any allowed column name." }, { "row": 871, "column": "Index", "new_value": "871", "reason": "The address '1256 military street south' does not match any allowed column name." }, { "row": 872, "column": "Index", "new_value": "872", "reason": "The address '1256 military street south' does not match any allowed column name." }, { "row": 873, "column": "Index", "new_value": "873", "reason": "The address '1256 military street south' does not match any allowed column name." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 870,\n \"column\": \"Index\",\n \"new_value\": \"870\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n },\n {\n \"row\": 871,\n \"column\": \"Index\",\n \"new_value\": \"871\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n },\n {\n \"row\": 872,\n \"column\": \"Index\",\n \"new_value\": \"872\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n },\n {\n \"row\": 873,\n \"column\": \"Index\",\n \"new_value\": \"873\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n }\n ]\n}\n```" }, { "task_index": 23, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 4 }, "target_rows": [ { "_row": "324", "tuple_id": "325", "src": "weather", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:20 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "2:49 p.m." }, { "_row": "325", "tuple_id": "326", "src": "weather", "flight": "UA-854-SFO-IAH", "sched_dep_time": "7:53 a.m.", "act_dep_time": "8:07 a.m.", "sched_arr_time": "1:39 p.m.", "act_arr_time": "1:23 p.m." }, { "_row": "326", "tuple_id": "327", "src": "weather", "flight": "AA-415-BOS-ORD", "sched_dep_time": "8:35 a.m.", "act_dep_time": "", "sched_arr_time": "10:40 a.m.", "act_arr_time": "" }, { "_row": "327", "tuple_id": "328", "src": "weather", "flight": "AA-85-JFK-SFO", "sched_dep_time": "3:05 p.m.", "act_dep_time": "", "sched_arr_time": "6:30 p.m.", "act_arr_time": "" } ], "ground_truth": [ { "row": 324, "column": "act_dep_time", "clean_value": "1:19 p.m." }, { "row": 324, "column": "act_arr_time", "clean_value": "3:13 p.m." }, { "row": 325, "column": "act_dep_time", "clean_value": "7:49 a.m." }, { "row": 325, "column": "act_arr_time", "clean_value": "1:30 p.m." }, { "row": 326, "column": "act_dep_time", "clean_value": "8:56 a.m." }, { "row": 326, "column": "act_arr_time", "clean_value": "10:16 a.m." }, { "row": 327, "column": "act_dep_time", "clean_value": "3:36 p.m." }, { "row": 327, "column": "act_arr_time", "clean_value": "6:43 p.m." } ], "predicted_repairs": [ { "row": 324, "column": "act_arr_time", "new_value": "1:23 p.m.", "reason": "The act_arr_time for flight AA-854-SFO-IAH has been updated to 1:23 PM." }, { "row": 325, "column": "act_arr_time", "new_value": "", "reason": "The act_arr_time for flight AA-85-JFK-SFO is missing or incorrect." }, { "row": 326, "column": "act_arr_time", "new_value": "", "reason": "The act_arr_time for flight AA-415-BOS-ORD is missing or incorrect." }, { "row": 327, "column": "act_arr_time", "new_value": "", "reason": "The act_arr_time for flight AA-789-ORD-DEN is missing or incorrect." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 324,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:23 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-854-SFO-IAH has been updated to 1:23 PM.\"\n },\n {\n \"row\": 325,\n \"column\": \"act_arr_time\",\n \"new_value\": \"\",\n \"reason\": \"The act_arr_time for flight AA-85-JFK-SFO is missing or incorrect.\"\n },\n {\n \"row\": 326,\n \"column\": \"act_arr_time\",\n \"new_value\": \"\",\n \"reason\": \"The act_arr_time for flight AA-415-BOS-ORD is missing or incorrect.\"\n },\n {\n \"row\": 327,\n \"column\": \"act_arr_time\",\n \"new_value\": \"\",\n \"reason\": \"The act_arr_time for flight AA-789-ORD-DEN is missing or incorrect.\"\n }\n ]\n}\n```" }, { "task_index": 24, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 4 }, "target_rows": [ { "_row": "1597", "index": "1598", "id": "1533", "beer-name": "G'KNIGHT", "style": "American Double / Imperial IPA", "ounces": "12.0 OZ.", "abv": "0.087%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1598", "index": "1599", "id": "1532", "beer-name": "Ten Fidy", "style": "Russian Imperial Stout", "ounces": "12.0 oz", "abv": "0.099%", "ibu": "98", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1599", "index": "1600", "id": "1328", "beer-name": "Deviant Dale's IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.08%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1600", "index": "1601", "id": "1175", "beer-name": "Old Chub", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" } ], "ground_truth": [ { "row": 1597, "column": "ounces", "clean_value": "12" }, { "row": 1597, "column": "abv", "clean_value": "0.087" }, { "row": 1598, "column": "ounces", "clean_value": "12" }, { "row": 1598, "column": "abv", "clean_value": "0.099" }, { "row": 1599, "column": "ounces", "clean_value": "16" }, { "row": 1599, "column": "abv", "clean_value": "0.08" }, { "row": 1600, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1597, "column": "Abv", "new_value": "0.087%", "reason": "The beer name 'G'KNIGHT' was found in the target row but does not match any allowed column value." }, { "row": 1598, "column": "Abv", "new_value": "0.099%", "reason": "The beer name 'Ten Fidy' was found in the target row but does not match any allowed column value." }, { "row": 1599, "column": "Abv", "new_value": "0.08%", "reason": "The beer name 'Deviant Dale's IPA' was found in the target row but does not match any allowed column value." }, { "row": 1600, "column": "Abv", "new_value": "0.08%", "reason": "The beer name 'Old Chub' was found in the target row but does not match any allowed column value." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1597,\n \"column\": \"Abv\",\n \"new_value\": \"0.087%\",\n \"reason\": \"The beer name 'G'KNIGHT' was found in the target row but does not match any allowed column value.\"\n },\n {\n \"row\": 1598,\n \"column\": \"Abv\",\n \"new_value\": \"0.099%\",\n \"reason\": \"The beer name 'Ten Fidy' was found in the target row but does not match any allowed column value.\"\n },\n {\n \"row\": 1599,\n \"column\": \"Abv\",\n \"new_value\": \"0.08%\",\n \"reason\": \"The beer name 'Deviant Dale's IPA' was found in the target row but does not match any allowed column value.\"\n },\n {\n \"row\": 1600,\n \"column\": \"Abv\",\n \"new_value\": \"0.08%\",\n \"reason\": \"The beer name 'Old Chub' was found in the target row but does not match any allowed column value.\"\n }\n ]\n}\n```" }, { "task_index": 25, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 5, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "overrepair": 3, "schema_case_error": 1, "wrong_cell": 1 }, "target_rows": [ { "_row": "661", "index": "662", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-3" }, { "_row": "662", "index": "663", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-4" }, { "_row": "663", "index": "664", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-6" }, { "_row": "664", "index": "665", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [], "predicted_repairs": [ { "row": 661, "column": "Index", "new_value": "662", "reason": "The new value for index has been set to 662." }, { "row": 662, "column": "ProviderNumber", "new_value": "10032", "reason": "The new value for ProviderNumber has been set to 10032." }, { "row": 663, "column": "Address1", "new_value": "209 north main street", "reason": "The new value for Address1 has been set to '209 north main street'." }, { "row": 664, "column": "Address2", "new_value": "", "reason": "The new value for Address2 has been left as an empty string ('')." }, { "row": 665, "column": "Address3", "new_value": "", "reason": "The new value for Address3 has been left as an empty string ('')." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 661,\n \"column\": \"Index\",\n \"new_value\": \"662\",\n \"reason\": \"The new value for index has been set to 662.\"\n },\n {\n \"row\": 662,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10032\",\n \"reason\": \"The new value for ProviderNumber has been set to 10032.\"\n },\n {\n \"row\": 663,\n \"column\": \"Address1\",\n \"new_value\": \"209 north main street\",\n \"reason\": \"The new value for Address1 has been set to '209 north main street'.\"\n },\n {\n \"row\": 664,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 has been left as an empty string ('').\"\n },\n {\n \"row\": 665,\n \"column\": \"Address3\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address3 has been left as an empty string ('').\"\n }\n ]\n}\n```" } ], "failure_samples_by_slice": { "deterministic_normalization": [ { "task_index": 3, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 3 }, "target_rows": [ { "_row": "1363", "index": "1364", "id": "2358", "beer-name": "Minhas Light (2012)", "style": "Light Lager", "ounces": "12.0 oz.", "abv": "0.04", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1364", "index": "1365", "id": "2282", "beer-name": "Huber", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "0.05%", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1365", "index": "1366", "id": "2281", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "16.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1366", "index": "1367", "id": "2280", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "12.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" } ], "ground_truth": [ { "row": 1363, "column": "ounces", "clean_value": "12" }, { "row": 1363, "column": "ibu", "clean_value": "" }, { "row": 1364, "column": "ounces", "clean_value": "12" }, { "row": 1364, "column": "abv", "clean_value": "0.05" }, { "row": 1364, "column": "ibu", "clean_value": "" }, { "row": 1365, "column": "ounces", "clean_value": "16" }, { "row": 1365, "column": "ibu", "clean_value": "" }, { "row": 1366, "column": "ounces", "clean_value": "12" }, { "row": 1366, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1363, "column": "Id", "new_value": "1364", "reason": "The beer name has been updated to 'Huber'." }, { "row": 1364, "column": "Id", "new_value": "1365", "reason": "The beer name has been updated to 'Clear Creek Ice'." }, { "row": 1365, "column": "Id", "new_value": "1366", "reason": "The beer name has been updated to 'Clear Creek Ice'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1363,\n \"column\": \"Id\",\n \"new_value\": \"1364\",\n \"reason\": \"The beer name has been updated to 'Huber'.\"\n },\n {\n \"row\": 1364,\n \"column\": \"Id\",\n \"new_value\": \"1365\",\n \"reason\": \"The beer name has been updated to 'Clear Creek Ice'.\"\n },\n {\n \"row\": 1365,\n \"column\": \"Id\",\n \"new_value\": \"1366\",\n \"reason\": \"The beer name has been updated to 'Clear Creek Ice'.\"\n }\n ]\n}\n```" }, { "task_index": 6, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 4 }, "target_rows": [ { "_row": "1840", "index": "1841", "id": "1539", "beer-name": "Monkey Fist IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.069%", "ibu": "65", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1841", "index": "1842", "id": "975", "beer-name": "Shipyard Summer Ale", "style": "American Pale Wheat Ale", "ounces": "12.0 oz", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1842", "index": "1843", "id": "814", "beer-name": "Pumpkinhead Ale", "style": "Pumpkin Ale", "ounces": "12.0 oz.", "abv": "0.047", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1843", "index": "1844", "id": "727", "beer-name": "Shipyard Export", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" } ], "ground_truth": [ { "row": 1840, "column": "ounces", "clean_value": "12" }, { "row": 1840, "column": "abv", "clean_value": "0.069" }, { "row": 1841, "column": "ounces", "clean_value": "12" }, { "row": 1841, "column": "ibu", "clean_value": "" }, { "row": 1842, "column": "ounces", "clean_value": "12" }, { "row": 1842, "column": "ibu", "clean_value": "" }, { "row": 1843, "column": "ounces", "clean_value": "12" }, { "row": 1843, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1840, "column": "Beer-Name", "new_value": "Monkey Fist IPA", "reason": "The beer name has been replaced with 'Monkey Fist IPA'." }, { "row": 1841, "column": "Beer-Name", "new_value": "Shipyard Summer Ale", "reason": "The beer name has been replaced with 'Shipyard Summer Ale'." }, { "row": 1842, "column": "Beer-Name", "new_value": "Pumpkinhead Ale", "reason": "The beer name has been replaced with 'Pumpkinhead Ale'." }, { "row": 1843, "column": "Beer-Name", "new_value": "Shipyard Export", "reason": "The beer name has been replaced with 'Shipyard Export'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1840,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Monkey Fist IPA\",\n \"reason\": \"The beer name has been replaced with 'Monkey Fist IPA'.\"\n },\n {\n \"row\": 1841,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Shipyard Summer Ale\",\n \"reason\": \"The beer name has been replaced with 'Shipyard Summer Ale'.\"\n },\n {\n \"row\": 1842,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Pumpkinhead Ale\",\n \"reason\": \"The beer name has been replaced with 'Pumpkinhead Ale'.\"\n },\n {\n \"row\": 1843,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Shipyard Export\",\n \"reason\": \"The beer name has been replaced with 'Shipyard Export'.\"\n }\n ]\n}\n```" }, { "task_index": 9, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 }, "target_rows": [ { "_row": "657", "index": "658", "id": "685", "beer-name": "Lava Lake Wit", "style": "Witbier", "ounces": "12.0 oz.", "abv": "0.052", "ibu": "15", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "658", "index": "659", "id": "613", "beer-name": "Mountain Livin' Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.06", "ibu": "N/A", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "659", "index": "660", "id": "356", "beer-name": "Crazy Mountain Amber Ale", "style": "American Amber / Red Ale", "ounces": "12.0 ounce", "abv": "0.052", "ibu": "25", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "660", "index": "661", "id": "2029", "beer-name": "Tropicalia", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.065", "ibu": "65", "brewery_id": "247", "brewery-name": "Creature Comforts", "city": "Athens", "state": "GA" } ], "ground_truth": [ { "row": 657, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ibu", "clean_value": "" }, { "row": 659, "column": "ounces", "clean_value": "12" }, { "row": 660, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 657, "column": "abv", "new_value": "0.052", "reason": "The beer name 'Lava Lake Wit' was found in the target row but does not match any of the allowed beer names." }, { "row": 658, "column": "abv", "new_value": "0.06", "reason": "The beer name 'Mountain Livin' Pale Ale' was found in the target row but does not match any of the allowed beer names." }, { "row": 659, "column": "abv", "new_value": "0.052", "reason": "The beer name 'Crazy Mountain Amber Ale' was found in the target row but does not match any of the allowed beer names." }, { "row": 660, "column": "abv", "new_value": "0.065", "reason": "The beer name 'Tropicalia' was found in the target row but does not match any of the allowed beer names." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 657,\n \"column\": \"abv\",\n \"new_value\": \"0.052\",\n \"reason\": \"The beer name 'Lava Lake Wit' was found in the target row but does not match any of the allowed beer names.\"\n },\n {\n \"row\": 658,\n \"column\": \"abv\",\n \"new_value\": \"0.06\",\n \"reason\": \"The beer name 'Mountain Livin' Pale Ale' was found in the target row but does not match any of the allowed beer names.\"\n },\n {\n \"row\": 659,\n \"column\": \"abv\",\n \"new_value\": \"0.052\",\n \"reason\": \"The beer name 'Crazy Mountain Amber Ale' was found in the target row but does not match any of the allowed beer names.\"\n },\n {\n \"row\": 660,\n \"column\": \"abv\",\n \"new_value\": \"0.065\",\n \"reason\": \"The beer name 'Tropicalia' was found in the target row but does not match any of the allowed beer names.\"\n }\n ]\n}\n```" }, { "task_index": 15, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 }, "target_rows": [ { "_row": "1813", "index": "1814", "id": "307", "beer-name": "Santa Fe Oktoberfest", "style": "M\u00e4rzen / Oktoberfest", "ounces": "12.0 oz.", "abv": "", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1814", "index": "1815", "id": "305", "beer-name": "Imperial Java Stout", "style": "Russian Imperial Stout", "ounces": "12.0 oz.", "abv": "0.08%", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1815", "index": "1816", "id": "304", "beer-name": "Freestyle Pilsner", "style": "German Pilsener", "ounces": "12.0 oz.", "abv": "0.055", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1816", "index": "1817", "id": "217", "beer-name": "Happy Camper IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.066", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" } ], "ground_truth": [ { "row": 1813, "column": "ounces", "clean_value": "12" }, { "row": 1813, "column": "ibu", "clean_value": "" }, { "row": 1814, "column": "ounces", "clean_value": "12" }, { "row": 1814, "column": "abv", "clean_value": "0.08" }, { "row": 1814, "column": "ibu", "clean_value": "" }, { "row": 1815, "column": "ounces", "clean_value": "12" }, { "row": 1815, "column": "ibu", "clean_value": "" }, { "row": 1816, "column": "ounces", "clean_value": "12" }, { "row": 1816, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1813, "column": "style", "new_value": "Happy Camper IPA", "reason": "The beer name has been replaced with 'Happy Camper IPA'." }, { "row": 1814, "column": "style", "new_value": "Imperial Java Stout", "reason": "The beer name has been replaced with 'Imperial Java Stout'." }, { "row": 1815, "column": "style", "new_value": "Freestyle Pilsner", "reason": "The beer name has been replaced with 'Freestyle Pilsner'." }, { "row": 1816, "column": "style", "new_value": "Happy Camper IPA", "reason": "The beer name has been replaced with 'Happy Camper IPA'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1813,\n \"column\": \"style\",\n \"new_value\": \"Happy Camper IPA\",\n \"reason\": \"The beer name has been replaced with 'Happy Camper IPA'.\"\n },\n {\n \"row\": 1814,\n \"column\": \"style\",\n \"new_value\": \"Imperial Java Stout\",\n \"reason\": \"The beer name has been replaced with 'Imperial Java Stout'.\"\n },\n {\n \"row\": 1815,\n \"column\": \"style\",\n \"new_value\": \"Freestyle Pilsner\",\n \"reason\": \"The beer name has been replaced with 'Freestyle Pilsner'.\"\n },\n {\n \"row\": 1816,\n \"column\": \"style\",\n \"new_value\": \"Happy Camper IPA\",\n \"reason\": \"The beer name has been replaced with 'Happy Camper IPA'.\"\n }\n ]\n}\n```" }, { "task_index": 21, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 4 }, "target_rows": [ { "_row": "662", "index": "663", "id": "2293", "beer-name": "Aviator Raspberry Blonde", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.049%", "ibu": "25", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "663", "index": "664", "id": "1105", "beer-name": "3 Picket Porter", "style": "American Porter", "ounces": "12.0 oz.", "abv": "0.055%", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "664", "index": "665", "id": "1104", "beer-name": "Rusty Nail Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.056", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "665", "index": "666", "id": "2145", "beer-name": "Red Water Irish Style Red", "style": "American Amber / Red Ale", "ounces": "12.0 OZ.", "abv": "0.065", "ibu": "N/A", "brewery_id": "212", "brewery-name": "Crow Peak Brewing Company", "city": "Spearfish", "state": "SD" } ], "ground_truth": [ { "row": 662, "column": "ounces", "clean_value": "12" }, { "row": 662, "column": "abv", "clean_value": "0.049" }, { "row": 663, "column": "ounces", "clean_value": "12" }, { "row": 663, "column": "abv", "clean_value": "0.055" }, { "row": 663, "column": "ibu", "clean_value": "" }, { "row": 664, "column": "ounces", "clean_value": "12" }, { "row": 664, "column": "ibu", "clean_value": "" }, { "row": 665, "column": "ounces", "clean_value": "12" }, { "row": 665, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 662, "column": "style", "new_value": "American Blonde Ale", "reason": "The beer name has been changed to American Blonde Ale." }, { "row": 663, "column": "style", "new_value": "American Porter", "reason": "The beer name has been changed to American Porter." }, { "row": 664, "column": "style", "new_value": "American Pale Ale (APA)", "reason": "The beer name has been changed to American Pale Ale (APA)." }, { "row": 665, "column": "style", "new_value": "American Amber / Red Ale", "reason": "The beer name has been changed to American Amber / Red Ale." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 662,\n \"column\": \"style\",\n \"new_value\": \"American Blonde Ale\",\n \"reason\": \"The beer name has been changed to American Blonde Ale.\"\n },\n {\n \"row\": 663,\n \"column\": \"style\",\n \"new_value\": \"American Porter\",\n \"reason\": \"The beer name has been changed to American Porter.\"\n },\n {\n \"row\": 664,\n \"column\": \"style\",\n \"new_value\": \"American Pale Ale (APA)\",\n \"reason\": \"The beer name has been changed to American Pale Ale (APA).\"\n },\n {\n \"row\": 665,\n \"column\": \"style\",\n \"new_value\": \"American Amber / Red Ale\",\n \"reason\": \"The beer name has been changed to American Amber / Red Ale.\"\n }\n ]\n}\n```" }, { "task_index": 24, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 4 }, "target_rows": [ { "_row": "1597", "index": "1598", "id": "1533", "beer-name": "G'KNIGHT", "style": "American Double / Imperial IPA", "ounces": "12.0 OZ.", "abv": "0.087%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1598", "index": "1599", "id": "1532", "beer-name": "Ten Fidy", "style": "Russian Imperial Stout", "ounces": "12.0 oz", "abv": "0.099%", "ibu": "98", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1599", "index": "1600", "id": "1328", "beer-name": "Deviant Dale's IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.08%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1600", "index": "1601", "id": "1175", "beer-name": "Old Chub", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" } ], "ground_truth": [ { "row": 1597, "column": "ounces", "clean_value": "12" }, { "row": 1597, "column": "abv", "clean_value": "0.087" }, { "row": 1598, "column": "ounces", "clean_value": "12" }, { "row": 1598, "column": "abv", "clean_value": "0.099" }, { "row": 1599, "column": "ounces", "clean_value": "16" }, { "row": 1599, "column": "abv", "clean_value": "0.08" }, { "row": 1600, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1597, "column": "Abv", "new_value": "0.087%", "reason": "The beer name 'G'KNIGHT' was found in the target row but does not match any allowed column value." }, { "row": 1598, "column": "Abv", "new_value": "0.099%", "reason": "The beer name 'Ten Fidy' was found in the target row but does not match any allowed column value." }, { "row": 1599, "column": "Abv", "new_value": "0.08%", "reason": "The beer name 'Deviant Dale's IPA' was found in the target row but does not match any allowed column value." }, { "row": 1600, "column": "Abv", "new_value": "0.08%", "reason": "The beer name 'Old Chub' was found in the target row but does not match any allowed column value." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1597,\n \"column\": \"Abv\",\n \"new_value\": \"0.087%\",\n \"reason\": \"The beer name 'G'KNIGHT' was found in the target row but does not match any allowed column value.\"\n },\n {\n \"row\": 1598,\n \"column\": \"Abv\",\n \"new_value\": \"0.099%\",\n \"reason\": \"The beer name 'Ten Fidy' was found in the target row but does not match any allowed column value.\"\n },\n {\n \"row\": 1599,\n \"column\": \"Abv\",\n \"new_value\": \"0.08%\",\n \"reason\": \"The beer name 'Deviant Dale's IPA' was found in the target row but does not match any allowed column value.\"\n },\n {\n \"row\": 1600,\n \"column\": \"Abv\",\n \"new_value\": \"0.08%\",\n \"reason\": \"The beer name 'Old Chub' was found in the target row but does not match any allowed column value.\"\n }\n ]\n}\n```" }, { "task_index": 30, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_cell": 4 }, "target_rows": [ { "_row": "374", "index": "375", "id": "1288", "beer-name": "Bozone Hefe Weizen", "style": "Hefeweizen", "ounces": "12.0 oz.", "abv": "0.06", "ibu": "25", "brewery_id": "219", "brewery-name": "Bozeman Brewing Company", "city": "Bozeman", "state": "MT" }, { "_row": "375", "index": "376", "id": "470", "beer-name": "Bozone Select Amber Ale", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.055%", "ibu": "N/A", "brewery_id": "219", "brewery-name": "Bozeman Brewing Company", "city": "Bozeman", "state": "MT" }, { "_row": "376", "index": "377", "id": "2167", "beer-name": "Evil Owl", "style": "American Amber / Red Ale", "ounces": "12.0 oz. Alumi-Tek", "abv": "0.052", "ibu": "40", "brewery_id": "207", "brewery-name": "Branchline Brewing Company", "city": "San Antonio", "state": "TX" }, { "_row": "377", "index": "378", "id": "2204", "beer-name": "Post Time K\u00f6lsch", "style": "K\u00f6lsch", "ounces": "16.0 oz", "abv": "0.05", "ibu": "N/A", "brewery_id": "195", "brewery-name": "Breakside Brewery", "city": "Portland", "state": "OR" } ], "ground_truth": [ { "row": 374, "column": "ounces", "clean_value": "12" }, { "row": 375, "column": "ounces", "clean_value": "12" }, { "row": 375, "column": "abv", "clean_value": "0.055" }, { "row": 375, "column": "ibu", "clean_value": "" }, { "row": 376, "column": "ounces", "clean_value": "12" }, { "row": 377, "column": "ounces", "clean_value": "16" }, { "row": 377, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 374, "column": "bozeman_brewery_name", "new_value": "Bozeman Brewing Company", "reason": "The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'." }, { "row": 375, "column": "bozeman_brewery_name", "new_value": "Bozeman Brewing Company", "reason": "The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'." }, { "row": 376, "column": "bozeman_brewery_name", "new_value": "Bozeman Brewing Company", "reason": "The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'." }, { "row": 377, "column": "bozeman_brewery_name", "new_value": "Bozeman Brewing Company", "reason": "The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 374,\n \"column\": \"bozeman_brewery_name\",\n \"new_value\": \"Bozeman Brewing Company\",\n \"reason\": \"The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'.\"\n },\n {\n \"row\": 375,\n \"column\": \"bozeman_brewery_name\",\n \"new_value\": \"Bozeman Brewing Company\",\n \"reason\": \"The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'.\"\n },\n {\n \"row\": 376,\n \"column\": \"bozeman_brewery_name\",\n \"new_value\": \"Bozeman Brewing Company\",\n \"reason\": \"The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'.\"\n },\n {\n \"row\": 377,\n \"column\": \"bozeman_brewery_name\",\n \"new_value\": \"Bozeman Brewing Company\",\n \"reason\": \"The beer name has been changed to 'Bozone Hefe Weizen' from 'Bozeman Brewing Company'.\"\n }\n ]\n}\n```" }, { "task_index": 36, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 4 }, "target_rows": [ { "_row": "2211", "index": "2212", "id": "114", "beer-name": "Triangle White Ale", "style": "Witbier", "ounces": "12.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "524", "brewery-name": "Triangle Brewing Company", "city": "Durham", "state": "NC" }, { "_row": "2212", "index": "2213", "id": "113", "beer-name": "Triangle Belgian Golden Ale", "style": "Belgian Strong Pale Ale", "ounces": "12.0 ounce", "abv": "0.08%", "ibu": "N/A", "brewery_id": "524", "brewery-name": "Triangle Brewing Company", "city": "Durham", "state": "NC" }, { "_row": "2213", "index": "2214", "id": "2445", "beer-name": "Troegenator", "style": "Doppelbock", "ounces": "16.0 ounce", "abv": "0.082", "ibu": "N/A", "brewery_id": "97", "brewery-name": "Tr\u00f6egs Brewing Company", "city": "Hershey", "state": "PA" }, { "_row": "2214", "index": "2215", "id": "2444", "beer-name": "Nugget Nectar", "style": "American Amber / Red Ale", "ounces": "16.0 ounce", "abv": "0.075", "ibu": "93", "brewery_id": "97", "brewery-name": "Tr\u00f6egs Brewing Company", "city": "Hershey", "state": "PA" } ], "ground_truth": [ { "row": 2211, "column": "ounces", "clean_value": "12" }, { "row": 2211, "column": "ibu", "clean_value": "" }, { "row": 2212, "column": "ounces", "clean_value": "12" }, { "row": 2212, "column": "abv", "clean_value": "0.08" }, { "row": 2212, "column": "ibu", "clean_value": "" }, { "row": 2213, "column": "ounces", "clean_value": "16" }, { "row": 2213, "column": "ibu", "clean_value": "" }, { "row": 2214, "column": "ounces", "clean_value": "16" } ], "predicted_repairs": [ { "row": 2211, "column": "Beer-Name", "new_value": "Triangle White Ale", "reason": "The beer name has been replaced with 'Triangle White Ale'." }, { "row": 2212, "column": "Beer-Name", "new_value": "Triangle Belgian Golden Ale", "reason": "The beer name has been replaced with 'Triangle Belgian Golden Ale'." }, { "row": 2213, "column": "Beer-Name", "new_value": "Troegenator", "reason": "The beer name has been replaced with 'Troegenator'." }, { "row": 2214, "column": "Beer-Name", "new_value": "Nugget Nectar", "reason": "The beer name has been replaced with 'Nugget Nectar'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 2211,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Triangle White Ale\",\n \"reason\": \"The beer name has been replaced with 'Triangle White Ale'.\"\n },\n {\n \"row\": 2212,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Triangle Belgian Golden Ale\",\n \"reason\": \"The beer name has been replaced with 'Triangle Belgian Golden Ale'.\"\n },\n {\n \"row\": 2213,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Troegenator\",\n \"reason\": \"The beer name has been replaced with 'Troegenator'.\"\n },\n {\n \"row\": 2214,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Nugget Nectar\",\n \"reason\": \"The beer name has been replaced with 'Nugget Nectar'.\"\n }\n ]\n}\n```" }, { "task_index": 39, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3 }, "target_rows": [ { "_row": "1271", "index": "1272", "id": "1671", "beer-name": "Gillespie Brown Ale", "style": "American Brown Ale", "ounces": "12.0 oz", "abv": "0.095", "ibu": "49", "brewery_id": "346", "brewery-name": "Manzanita Brewing Company", "city": "Santee", "state": "CA" }, { "_row": "1272", "index": "1273", "id": "1670", "beer-name": "Manzanita Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 OZ.", "abv": "0.066", "ibu": "44", "brewery_id": "346", "brewery-name": "Manzanita Brewing Company", "city": "Santee", "state": "CA" }, { "_row": "1273", "index": "1274", "id": "1262", "beer-name": "Marble Pilsner", "style": "German Pilsener", "ounces": "12.0 oz", "abv": "0.047%", "ibu": "N/A", "brewery_id": "443", "brewery-name": "Marble Brewery", "city": "Albuquerque", "state": "NM" }, { "_row": "1274", "index": "1275", "id": "845", "beer-name": "Marble India Pale Ale", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "443", "brewery-name": "Marble Brewery", "city": "Albuquerque", "state": "NM" } ], "ground_truth": [ { "row": 1271, "column": "ounces", "clean_value": "12" }, { "row": 1272, "column": "ounces", "clean_value": "12" }, { "row": 1273, "column": "ounces", "clean_value": "12" }, { "row": 1273, "column": "abv", "clean_value": "0.047" }, { "row": 1273, "column": "ibu", "clean_value": "" }, { "row": 1274, "column": "ounces", "clean_value": "12" }, { "row": 1274, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1271, "column": "style", "new_value": "American Brown Ale", "reason": "The beer name has been changed to 'American Brown Ale'." }, { "row": 1272, "column": "style", "new_value": "American Pale Ale (APA)", "reason": "The beer name has been changed to 'American Pale Ale (APA)'." }, { "row": 1273, "column": "style", "new_value": "German Pilsener", "reason": "The beer name has been changed to 'German Pilsener'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1271,\n \"column\": \"style\",\n \"new_value\": \"American Brown Ale\",\n \"reason\": \"The beer name has been changed to 'American Brown Ale'.\"\n },\n {\n \"row\": 1272,\n \"column\": \"style\",\n \"new_value\": \"American Pale Ale (APA)\",\n \"reason\": \"The beer name has been changed to 'American Pale Ale (APA)'.\"\n },\n {\n \"row\": 1273,\n \"column\": \"style\",\n \"new_value\": \"German Pilsener\",\n \"reason\": \"The beer name has been changed to 'German Pilsener'.\"\n }\n ]\n}\n```" }, { "task_index": 48, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 3 }, "target_rows": [ { "_row": "491", "index": "492", "id": "49", "beer-name": "Porkslap Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.043%", "ibu": "N/A", "brewery_id": "556", "brewery-name": "Butternuts Beer and Ale", "city": "Garrattsville", "state": "NY" }, { "_row": "492", "index": "493", "id": "2657", "beer-name": "Blackbeard", "style": "American Double / Imperial Stout", "ounces": "12.0 ounce", "abv": "0.093", "ibu": "N/A", "brewery_id": "5", "brewery-name": "COAST Brewing Company", "city": "Charleston", "state": "SC" }, { "_row": "493", "index": "494", "id": "2656", "beer-name": "Rye Knot", "style": "American Brown Ale", "ounces": "12.0 oz. Alumi-Tek", "abv": "0.062", "ibu": "N/A", "brewery_id": "5", "brewery-name": "COAST Brewing Company", "city": "Charleston", "state": "SC" }, { "_row": "494", "index": "495", "id": "2655", "beer-name": "Dead Arm", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.06", "ibu": "N/A", "brewery_id": "5", "brewery-name": "COAST Brewing Company", "city": "Charleston", "state": "SC" } ], "ground_truth": [ { "row": 491, "column": "ounces", "clean_value": "12" }, { "row": 491, "column": "abv", "clean_value": "0.043" }, { "row": 491, "column": "ibu", "clean_value": "" }, { "row": 492, "column": "ounces", "clean_value": "12" }, { "row": 492, "column": "ibu", "clean_value": "" }, { "row": 493, "column": "ounces", "clean_value": "12" }, { "row": 493, "column": "ibu", "clean_value": "" }, { "row": 494, "column": "ounces", "clean_value": "12" }, { "row": 494, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 491, "column": "Beer-Name", "new_value": "Blackbeard", "reason": "The beer name has been replaced with 'Blackbeard'." }, { "row": 492, "column": "Beer-Name", "new_value": "Rye Knot", "reason": "The beer name has been replaced with 'Rye Knot'." }, { "row": 493, "column": "Beer-Name", "new_value": "Dead Arm", "reason": "The beer name has been replaced with 'Dead Arm'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 491,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Blackbeard\",\n \"reason\": \"The beer name has been replaced with 'Blackbeard'.\"\n },\n {\n \"row\": 492,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Rye Knot\",\n \"reason\": \"The beer name has been replaced with 'Rye Knot'.\"\n },\n {\n \"row\": 493,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dead Arm\",\n \"reason\": \"The beer name has been replaced with 'Dead Arm'.\"\n }\n ]\n}\n```" }, { "task_index": 51, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 10, "schema_case_error": 3 }, "target_rows": [ { "_row": "2265", "index": "2266", "id": "877", "beer-name": "Draught Hard Apple Cider", "style": "Cider", "ounces": "16.0 oz", "abv": "0.065", "ibu": "N/A", "brewery_id": "338", "brewery-name": "Uncle John's Fruit House Winery", "city": "St. John's", "state": "MI" }, { "_row": "2266", "index": "2267", "id": "606", "beer-name": "Scotty K NA", "style": "Low Alcohol Beer", "ounces": "16.0 ounce", "abv": "0.001%", "ibu": "N/A", "brewery_id": "522", "brewery-name": "Uncommon Brewers", "city": "Santa Cruz", "state": "CA" }, { "_row": "2267", "index": "2268", "id": "543", "beer-name": "Bacon Brown Ale", "style": "American Brown Ale", "ounces": "16.0 oz", "abv": "0.068%", "ibu": "N/A", "brewery_id": "522", "brewery-name": "Uncommon Brewers", "city": "Santa Cruz", "state": "CA" }, { "_row": "2268", "index": "2269", "id": "347", "beer-name": "Golden State Ale", "style": "Belgian Pale Ale", "ounces": "16.0 oz.", "abv": "0.064", "ibu": "N/A", "brewery_id": "522", "brewery-name": "Uncommon Brewers", "city": "Santa Cruz", "state": "CA" } ], "ground_truth": [ { "row": 2265, "column": "ounces", "clean_value": "16" }, { "row": 2265, "column": "ibu", "clean_value": "" }, { "row": 2266, "column": "ounces", "clean_value": "16" }, { "row": 2266, "column": "abv", "clean_value": "0.001" }, { "row": 2266, "column": "ibu", "clean_value": "" }, { "row": 2267, "column": "ounces", "clean_value": "16" }, { "row": 2267, "column": "abv", "clean_value": "0.068" }, { "row": 2267, "column": "ibu", "clean_value": "" }, { "row": 2268, "column": "ounces", "clean_value": "16" }, { "row": 2268, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 2265, "column": "Beer-Name", "new_value": "Scotty K NA", "reason": "The beer name has been updated to 'Scotty K NA'." }, { "row": 2266, "column": "Beer-Name", "new_value": "Bacon Brown Ale", "reason": "The beer name has been updated to 'Bacon Brown Ale'." }, { "row": 2267, "column": "Beer-Name", "new_value": "Golden State Ale", "reason": "The beer name has been updated to 'Golden State Ale'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 2265,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Scotty K NA\",\n \"reason\": \"The beer name has been updated to 'Scotty K NA'.\"\n },\n {\n \"row\": 2266,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Bacon Brown Ale\",\n \"reason\": \"The beer name has been updated to 'Bacon Brown Ale'.\"\n },\n {\n \"row\": 2267,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Golden State Ale\",\n \"reason\": \"The beer name has been updated to 'Golden State Ale'.\"\n }\n ]\n}\n```" }, { "task_index": 54, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 9, "schema_case_error": 4 }, "target_rows": [ { "_row": "123", "index": "124", "id": "1293", "beer-name": "Angry Orchard Crisp Apple", "style": "Cider", "ounces": "16.0 oz.", "abv": "0.05%", "ibu": "N/A", "brewery_id": "434", "brewery-name": "Angry Orchard Cider Company", "city": "Cincinnati", "state": "OH" }, { "_row": "124", "index": "125", "id": "1292", "beer-name": "Angry Orchard Crisp Apple", "style": "Cider", "ounces": "12.0 OZ.", "abv": "0.05", "ibu": "N/A", "brewery_id": "434", "brewery-name": "Angry Orchard Cider Company", "city": "Cincinnati", "state": "OH" }, { "_row": "125", "index": "126", "id": "2207", "beer-name": "Golden One", "style": "Belgian Pale Ale", "ounces": "12.0 oz.", "abv": "0.068", "ibu": "N/A", "brewery_id": "193", "brewery-name": "Anthem Brewing Company", "city": "Oklahoma City", "state": "OK" }, { "_row": "126", "index": "127", "id": "2040", "beer-name": "Arjuna", "style": "Witbier", "ounces": "12.0 ounce", "abv": "0.06", "ibu": "N/A", "brewery_id": "193", "brewery-name": "Anthem Brewing Company", "city": "Oklahoma City", "state": "OK" } ], "ground_truth": [ { "row": 123, "column": "ounces", "clean_value": "16" }, { "row": 123, "column": "abv", "clean_value": "0.05" }, { "row": 123, "column": "ibu", "clean_value": "" }, { "row": 124, "column": "ounces", "clean_value": "12" }, { "row": 124, "column": "ibu", "clean_value": "" }, { "row": 125, "column": "ounces", "clean_value": "12" }, { "row": 125, "column": "ibu", "clean_value": "" }, { "row": 126, "column": "ounces", "clean_value": "12" }, { "row": 126, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 123, "column": "Abv", "new_value": "0.05%", "reason": "The beer name 'Angry Orchard Crisp Apple' is missing an abv value." }, { "row": 124, "column": "Abv", "new_value": "0.05", "reason": "The beer name 'Angry Orchard Crisp Apple' has a missing abv value." }, { "row": 125, "column": "Abv", "new_value": "0.068", "reason": "The beer name 'Golden One' has a missing abv value." }, { "row": 126, "column": "Abv", "new_value": "0.06", "reason": "The beer name 'Arjuna' has a missing abv value." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 123,\n \"column\": \"Abv\",\n \"new_value\": \"0.05%\",\n \"reason\": \"The beer name 'Angry Orchard Crisp Apple' is missing an abv value.\"\n },\n {\n \"row\": 124,\n \"column\": \"Abv\",\n \"new_value\": \"0.05\",\n \"reason\": \"The beer name 'Angry Orchard Crisp Apple' has a missing abv value.\"\n },\n {\n \"row\": 125,\n \"column\": \"Abv\",\n \"new_value\": \"0.068\",\n \"reason\": \"The beer name 'Golden One' has a missing abv value.\"\n },\n {\n \"row\": 126,\n \"column\": \"Abv\",\n \"new_value\": \"0.06\",\n \"reason\": \"The beer name 'Arjuna' has a missing abv value.\"\n }\n ]\n}\n```" }, { "task_index": 57, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 }, "target_rows": [ { "_row": "782", "index": "783", "id": "1731", "beer-name": "Peaches & Cream", "style": "Fruit / Vegetable Beer", "ounces": "16.0 oz.", "abv": "0.046", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "783", "index": "784", "id": "1022", "beer-name": "Quaff India Style Session Ale", "style": "American IPA", "ounces": "16.0 OZ.", "abv": "0.051", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "784", "index": "785", "id": "895", "beer-name": "Loki Red Ale (2013)", "style": "American Amber / Red Ale", "ounces": "16.0 OZ.", "abv": "0.075", "ibu": "53", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "785", "index": "786", "id": "682", "beer-name": "Mjolnir Imperial IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.069", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" } ], "ground_truth": [ { "row": 782, "column": "ounces", "clean_value": "16" }, { "row": 782, "column": "ibu", "clean_value": "" }, { "row": 783, "column": "ounces", "clean_value": "16" }, { "row": 783, "column": "ibu", "clean_value": "" }, { "row": 784, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 782, "column": "abv", "new_value": "0.046", "reason": "The beer name has been replaced with 'Peaches & Cream'." }, { "row": 783, "column": "abv", "new_value": "0.051", "reason": "The beer name has been replaced with 'Quaff India Style Session Ale'." }, { "row": 784, "column": "abv", "new_value": "0.075", "reason": "The beer name has been replaced with 'Loki Red Ale (2013)'." }, { "row": 785, "column": "abv", "new_value": "0.069", "reason": "The beer name has been replaced with 'Mjolnir Imperial IPA'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 782,\n \"column\": \"abv\",\n \"new_value\": \"0.046\",\n \"reason\": \"The beer name has been replaced with 'Peaches & Cream'.\"\n },\n {\n \"row\": 783,\n \"column\": \"abv\",\n \"new_value\": \"0.051\",\n \"reason\": \"The beer name has been replaced with 'Quaff India Style Session Ale'.\"\n },\n {\n \"row\": 784,\n \"column\": \"abv\",\n \"new_value\": \"0.075\",\n \"reason\": \"The beer name has been replaced with 'Loki Red Ale (2013)'.\"\n },\n {\n \"row\": 785,\n \"column\": \"abv\",\n \"new_value\": \"0.069\",\n \"reason\": \"The beer name has been replaced with 'Mjolnir Imperial IPA'.\"\n }\n ]\n}\n```" }, { "task_index": 72, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 3 }, "target_rows": [ { "_row": "1325", "index": "1326", "id": "1508", "beer-name": "Shark Bait", "style": "Fruit / Vegetable Beer", "ounces": "12.0 oz", "abv": "0.053%", "ibu": "11", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" }, { "_row": "1326", "index": "1327", "id": "1507", "beer-name": "Gator Tail Brown Ale", "style": "American Brown Ale", "ounces": "12.0 ounce", "abv": "0.053", "ibu": "30", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" }, { "_row": "1327", "index": "1328", "id": "1506", "beer-name": "Miami Vice IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.071", "ibu": "62", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" }, { "_row": "1328", "index": "1329", "id": "1325", "beer-name": "Big Rod Coconut Ale", "style": "American Blonde Ale", "ounces": "12.0 oz", "abv": "0.053", "ibu": "16", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" } ], "ground_truth": [ { "row": 1325, "column": "ounces", "clean_value": "12" }, { "row": 1325, "column": "abv", "clean_value": "0.053" }, { "row": 1326, "column": "ounces", "clean_value": "12" }, { "row": 1327, "column": "ounces", "clean_value": "12" }, { "row": 1328, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1325, "column": "style", "new_value": "Big Rod Coconut Ale", "reason": "The beer name has been changed to 'Big Rod Coconut Ale'." }, { "row": 1326, "column": "style", "new_value": "Gator Tail Brown Ale", "reason": "The beer name has been changed to 'Gator Tail Brown Ale'." }, { "row": 1327, "column": "style", "new_value": "Miami Vice IPA", "reason": "The beer name has been changed to 'Miami Vice IPA'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1325,\n \"column\": \"style\",\n \"new_value\": \"Big Rod Coconut Ale\",\n \"reason\": \"The beer name has been changed to 'Big Rod Coconut Ale'.\"\n },\n {\n \"row\": 1326,\n \"column\": \"style\",\n \"new_value\": \"Gator Tail Brown Ale\",\n \"reason\": \"The beer name has been changed to 'Gator Tail Brown Ale'.\"\n },\n {\n \"row\": 1327,\n \"column\": \"style\",\n \"new_value\": \"Miami Vice IPA\",\n \"reason\": \"The beer name has been changed to 'Miami Vice IPA'.\"\n }\n ]\n}\n```" }, { "task_index": 78, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 }, "target_rows": [ { "_row": "783", "index": "784", "id": "1022", "beer-name": "Quaff India Style Session Ale", "style": "American IPA", "ounces": "16.0 OZ.", "abv": "0.051", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "784", "index": "785", "id": "895", "beer-name": "Loki Red Ale (2013)", "style": "American Amber / Red Ale", "ounces": "16.0 OZ.", "abv": "0.075", "ibu": "53", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "785", "index": "786", "id": "682", "beer-name": "Mjolnir Imperial IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.069", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "786", "index": "787", "id": "112", "beer-name": "Fearless Scottish Ale", "style": "Scottish Ale", "ounces": "16.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" } ], "ground_truth": [ { "row": 783, "column": "ounces", "clean_value": "16" }, { "row": 783, "column": "ibu", "clean_value": "" }, { "row": 784, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ibu", "clean_value": "" }, { "row": 786, "column": "ounces", "clean_value": "16" }, { "row": 786, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 783, "column": "abv", "new_value": "0.051", "reason": "The beer name has been replaced with 'Quaff India Style Session Ale'." }, { "row": 784, "column": "abv", "new_value": "0.075", "reason": "The beer name has been replaced with 'Loki Red Ale (2013)'." }, { "row": 785, "column": "abv", "new_value": "0.069", "reason": "The beer name has been replaced with 'Mjolnir Imperial IPA'." }, { "row": 786, "column": "abv", "new_value": "0.05", "reason": "The beer name has been replaced with 'Fearless Scottish Ale'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 783,\n \"column\": \"abv\",\n \"new_value\": \"0.051\",\n \"reason\": \"The beer name has been replaced with 'Quaff India Style Session Ale'.\"\n },\n {\n \"row\": 784,\n \"column\": \"abv\",\n \"new_value\": \"0.075\",\n \"reason\": \"The beer name has been replaced with 'Loki Red Ale (2013)'.\"\n },\n {\n \"row\": 785,\n \"column\": \"abv\",\n \"new_value\": \"0.069\",\n \"reason\": \"The beer name has been replaced with 'Mjolnir Imperial IPA'.\"\n },\n {\n \"row\": 786,\n \"column\": \"abv\",\n \"new_value\": \"0.05\",\n \"reason\": \"The beer name has been replaced with 'Fearless Scottish Ale'.\"\n }\n ]\n}\n```" }, { "task_index": 81, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3 }, "target_rows": [ { "_row": "299", "index": "300", "id": "1025", "beer-name": "N Street Drive-In 50th Anniversary IPA", "style": "American Double / Imperial IPA", "ounces": "12.0 ounce", "abv": "", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" }, { "_row": "300", "index": "301", "id": "1012", "beer-name": "467 Ethan's Stout", "style": "American Stout", "ounces": "12.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" }, { "_row": "301", "index": "302", "id": "942", "beer-name": "1335 Wicked Snout", "style": "Saison / Farmhouse Ale", "ounces": "12.0 ounce", "abv": "0.064", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" }, { "_row": "302", "index": "303", "id": "937", "beer-name": "543 Skull Creek Fresh Hopped Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.045", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" } ], "ground_truth": [ { "row": 299, "column": "ounces", "clean_value": "12" }, { "row": 299, "column": "ibu", "clean_value": "" }, { "row": 300, "column": "ounces", "clean_value": "12" }, { "row": 300, "column": "ibu", "clean_value": "" }, { "row": 301, "column": "ounces", "clean_value": "12" }, { "row": 301, "column": "ibu", "clean_value": "" }, { "row": 302, "column": "ounces", "clean_value": "12" }, { "row": 302, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 299, "column": "style", "new_value": "American Double / Imperial IPA", "reason": "The beer name has been changed to American Double / Imperial IPA." }, { "row": 300, "column": "style", "new_value": "American Stout", "reason": "The beer name has been changed to American Stout." }, { "row": 301, "column": "style", "new_value": "Saison / Farmhouse Ale", "reason": "The beer name has been changed to Saison / Farmhouse Ale." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 299,\n \"column\": \"style\",\n \"new_value\": \"American Double / Imperial IPA\",\n \"reason\": \"The beer name has been changed to American Double / Imperial IPA.\"\n },\n {\n \"row\": 300,\n \"column\": \"style\",\n \"new_value\": \"American Stout\",\n \"reason\": \"The beer name has been changed to American Stout.\"\n },\n {\n \"row\": 301,\n \"column\": \"style\",\n \"new_value\": \"Saison / Farmhouse Ale\",\n \"reason\": \"The beer name has been changed to Saison / Farmhouse Ale.\"\n }\n ]\n}\n```" }, { "task_index": 84, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 6, "schema_case_error": 4 }, "target_rows": [ { "_row": "2014", "index": "2015", "id": "139", "beer-name": "Point Amber Classic", "style": "American Amber / Red Lager", "ounces": "12.0 oz.", "abv": "0.047", "ibu": "14", "brewery_id": "131", "brewery-name": "Stevens Point Brewery", "city": "Stevens Point", "state": "WI" }, { "_row": "2015", "index": "2016", "id": "138", "beer-name": "Point Special Lager", "style": "American Adjunct Lager", "ounces": "12.0 oz", "abv": "0.047", "ibu": "9", "brewery_id": "131", "brewery-name": "Stevens Point Brewery", "city": "Stevens Point", "state": "WI" }, { "_row": "2016", "index": "2017", "id": "953", "beer-name": "Wisco Disco", "style": "American Amber / Red Ale", "ounces": "16.0 ounce", "abv": "0.051%", "ibu": "31", "brewery_id": "486", "brewery-name": "Stillmank Beer Company", "city": "Green Bay", "state": "WI" }, { "_row": "2017", "index": "2018", "id": "1983", "beer-name": "Brontide", "style": "American Black Ale", "ounces": "12.0 OZ.", "abv": "0.05", "ibu": "N/A", "brewery_id": "255", "brewery-name": "Stillwater Artisanal Ales", "city": "Baltimore", "state": "MD" } ], "ground_truth": [ { "row": 2014, "column": "ounces", "clean_value": "12" }, { "row": 2015, "column": "ounces", "clean_value": "12" }, { "row": 2016, "column": "ounces", "clean_value": "16" }, { "row": 2016, "column": "abv", "clean_value": "0.051" }, { "row": 2017, "column": "ounces", "clean_value": "12" }, { "row": 2017, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 2014, "column": "Beer-Name", "new_value": "Point Amber Classic", "reason": "The beer name has been replaced with 'Point Amber Classic'." }, { "row": 2015, "column": "Beer-Name", "new_value": "Point Special Lager", "reason": "The beer name has been replaced with 'Point Special Lager'." }, { "row": 2016, "column": "Beer-Name", "new_value": "Wisco Disco", "reason": "The beer name has been replaced with 'Wisco Disco'." }, { "row": 2017, "column": "Beer-Name", "new_value": "Brontide", "reason": "The beer name has been replaced with 'Brontide'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 2014,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Point Amber Classic\",\n \"reason\": \"The beer name has been replaced with 'Point Amber Classic'.\"\n },\n {\n \"row\": 2015,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Point Special Lager\",\n \"reason\": \"The beer name has been replaced with 'Point Special Lager'.\"\n },\n {\n \"row\": 2016,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Wisco Disco\",\n \"reason\": \"The beer name has been replaced with 'Wisco Disco'.\"\n },\n {\n \"row\": 2017,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Brontide\",\n \"reason\": \"The beer name has been replaced with 'Brontide'.\"\n }\n ]\n}\n```" }, { "task_index": 87, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 }, "target_rows": [ { "_row": "203", "index": "204", "id": "1855", "beer-name": "Tarnation California-Style Lager", "style": "California Common / Steam Beer", "ounces": "12.0 oz", "abv": "0.053", "ibu": "N/A", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" }, { "_row": "204", "index": "205", "id": "1778", "beer-name": "On the Count of 3 (2015)", "style": "Hefeweizen", "ounces": "16.0 oz", "abv": "0.07%", "ibu": "42", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" }, { "_row": "205", "index": "206", "id": "1209", "beer-name": "Summer Swelter", "style": "American Pale Wheat Ale", "ounces": "12.0 oz", "abv": "0.047", "ibu": "N/A", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" }, { "_row": "206", "index": "207", "id": "954", "beer-name": "Phantom Punch Winter Stout", "style": "Foreign / Export Stout", "ounces": "12.0 oz.", "abv": "0.068", "ibu": "N/A", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" } ], "ground_truth": [ { "row": 203, "column": "ounces", "clean_value": "12" }, { "row": 203, "column": "ibu", "clean_value": "" }, { "row": 204, "column": "ounces", "clean_value": "16" }, { "row": 204, "column": "abv", "clean_value": "0.07" }, { "row": 205, "column": "ounces", "clean_value": "12" }, { "row": 205, "column": "ibu", "clean_value": "" }, { "row": 206, "column": "ounces", "clean_value": "12" }, { "row": 206, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 203, "column": "style", "new_value": "California Common / Steam Beer", "reason": "The beer name has been changed to 'California Common / Steam Beer' as per the contract." }, { "row": 204, "column": "style", "new_value": "Hefeweizen", "reason": "The beer name has been changed to 'Hefeweizen' as per the contract." }, { "row": 205, "column": "style", "new_value": "American Pale Wheat Ale", "reason": "The beer name has been changed to 'American Pale Wheat Ale' as per the contract." }, { "row": 206, "column": "style", "new_value": "Foreign / Export Stout", "reason": "The beer name has been changed to 'Foreign / Export Stout' as per the contract." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 203,\n \"column\": \"style\",\n \"new_value\": \"California Common / Steam Beer\",\n \"reason\": \"The beer name has been changed to 'California Common / Steam Beer' as per the contract.\"\n },\n {\n \"row\": 204,\n \"column\": \"style\",\n \"new_value\": \"Hefeweizen\",\n \"reason\": \"The beer name has been changed to 'Hefeweizen' as per the contract.\"\n },\n {\n \"row\": 205,\n \"column\": \"style\",\n \"new_value\": \"American Pale Wheat Ale\",\n \"reason\": \"The beer name has been changed to 'American Pale Wheat Ale' as per the contract.\"\n },\n {\n \"row\": 206,\n \"column\": \"style\",\n \"new_value\": \"Foreign / Export Stout\",\n \"reason\": \"The beer name has been changed to 'Foreign / Export Stout' as per the contract.\"\n }\n ]\n}\n```" }, { "task_index": 93, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 }, "target_rows": [ { "_row": "1413", "index": "1414", "id": "132", "beer-name": "Full Moon Belgian White Ale (2007)", "style": "Witbier", "ounces": "12.0 oz.", "abv": "0.085", "ibu": "N/A", "brewery_id": "507", "brewery-name": "Mudshark Brewing Company", "city": "Lake Havasu City", "state": "AZ" }, { "_row": "1414", "index": "1415", "id": "131", "beer-name": "Dry Heat Hefeweizen (2006)", "style": "Hefeweizen", "ounces": "12.0 OZ.", "abv": "0.055", "ibu": "N/A", "brewery_id": "507", "brewery-name": "Mudshark Brewing Company", "city": "Lake Havasu City", "state": "AZ" }, { "_row": "1415", "index": "1416", "id": "1598", "beer-name": "Mustang Sixty-Six", "style": "American Amber / Red Lager", "ounces": "12.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "366", "brewery-name": "Mustang Brewing Company", "city": "Mustang", "state": "OK" }, { "_row": "1416", "index": "1417", "id": "862", "beer-name": "Mustang '33", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "0.04", "ibu": "N/A", "brewery_id": "366", "brewery-name": "Mustang Brewing Company", "city": "Mustang", "state": "OK" } ], "ground_truth": [ { "row": 1413, "column": "ounces", "clean_value": "12" }, { "row": 1413, "column": "ibu", "clean_value": "" }, { "row": 1414, "column": "ounces", "clean_value": "12" }, { "row": 1414, "column": "ibu", "clean_value": "" }, { "row": 1415, "column": "ounces", "clean_value": "12" }, { "row": 1415, "column": "ibu", "clean_value": "" }, { "row": 1416, "column": "ounces", "clean_value": "12" }, { "row": 1416, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1413, "column": "abv", "new_value": "0.085", "reason": "The beer name has been replaced with a new value." }, { "row": 1414, "column": "abv", "new_value": "0.055", "reason": "The beer name has been replaced with a new value." }, { "row": 1415, "column": "abv", "new_value": "0.05", "reason": "The beer name has been replaced with a new value." }, { "row": 1416, "column": "abv", "new_value": "0.04", "reason": "The beer name has been replaced with a new value." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1413,\n \"column\": \"abv\",\n \"new_value\": \"0.085\",\n \"reason\": \"The beer name has been replaced with a new value.\"\n },\n {\n \"row\": 1414,\n \"column\": \"abv\",\n \"new_value\": \"0.055\",\n \"reason\": \"The beer name has been replaced with a new value.\"\n },\n {\n \"row\": 1415,\n \"column\": \"abv\",\n \"new_value\": \"0.05\",\n \"reason\": \"The beer name has been replaced with a new value.\"\n },\n {\n \"row\": 1416,\n \"column\": \"abv\",\n \"new_value\": \"0.04\",\n \"reason\": \"The beer name has been replaced with a new value.\"\n }\n ]\n}\n```" }, { "task_index": 99, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3 }, "target_rows": [ { "_row": "979", "index": "980", "id": "1106", "beer-name": "Pablo Beach Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.05%", "ibu": "30", "brewery_id": "466", "brewery-name": "Green Room Brewing", "city": "Jacksonville", "state": "FL" }, { "_row": "980", "index": "981", "id": "2314", "beer-name": "Wild Trail Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.057", "ibu": "44", "brewery_id": "156", "brewery-name": "Greenbrier Valley Brewing Company", "city": "Lewisburg", "state": "WV" }, { "_row": "981", "index": "982", "id": "2313", "beer-name": "Mothman Black IPA", "style": "American Black Ale", "ounces": "12.0 ounce", "abv": "0.067", "ibu": "71", "brewery_id": "156", "brewery-name": "Greenbrier Valley Brewing Company", "city": "Lewisburg", "state": "WV" }, { "_row": "982", "index": "983", "id": "2461", "beer-name": "Autumn Winds Fest Beer", "style": "M\u00e4rzen / Oktoberfest", "ounces": "16.0 ounce", "abv": "0.058", "ibu": "N/A", "brewery_id": "86", "brewery-name": "Grey Sail Brewing Company", "city": "Westerly", "state": "RI" } ], "ground_truth": [ { "row": 979, "column": "ounces", "clean_value": "12" }, { "row": 979, "column": "abv", "clean_value": "0.05" }, { "row": 980, "column": "ounces", "clean_value": "12" }, { "row": 981, "column": "ounces", "clean_value": "12" }, { "row": 982, "column": "ounces", "clean_value": "16" }, { "row": 982, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 979, "column": "style", "new_value": "Autumn Winds Fest Beer", "reason": "The beer name has been updated to 'Autumn Winds Fest Beer'." }, { "row": 980, "column": "style", "new_value": "Autumn Winds Fest Beer", "reason": "The beer name has been updated to 'Autumn Winds Fest Beer'." }, { "row": 981, "column": "style", "new_value": "Autumn Winds Fest Beer", "reason": "The beer name has been updated to 'Autumn Winds Fest Beer'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 979,\n \"column\": \"style\",\n \"new_value\": \"Autumn Winds Fest Beer\",\n \"reason\": \"The beer name has been updated to 'Autumn Winds Fest Beer'.\"\n },\n {\n \"row\": 980,\n \"column\": \"style\",\n \"new_value\": \"Autumn Winds Fest Beer\",\n \"reason\": \"The beer name has been updated to 'Autumn Winds Fest Beer'.\"\n },\n {\n \"row\": 981,\n \"column\": \"style\",\n \"new_value\": \"Autumn Winds Fest Beer\",\n \"reason\": \"The beer name has been updated to 'Autumn Winds Fest Beer'.\"\n }\n ]\n}\n```" } ], "not_inferable_from_prompt": [ { "task_index": 5, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1727", "tuple_id": "1728", "src": "ua", "flight": "UA-397-JFK-SFO", "sched_dep_time": "8:00 a.m.", "act_dep_time": "8:29 a.m.", "sched_arr_time": "11:55 a.m.", "act_arr_time": "11:58 a.m." }, { "_row": "1728", "tuple_id": "1729", "src": "ua", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1729", "tuple_id": "1730", "src": "ua", "flight": "UA-2830-MCO-CLT", "sched_dep_time": "3:27 p.m.", "act_dep_time": "3:27 p.m.", "sched_arr_time": "5:05 p.m.", "act_arr_time": "5:17 p.m." }, { "_row": "1730", "tuple_id": "1731", "src": "ua", "flight": "UA-5487-SFO-MRY", "sched_dep_time": "10:39 a.m.", "act_dep_time": "10:33 a.m.", "sched_arr_time": "11:19 a.m.", "act_arr_time": "11:21 a.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1727, "column": "act_arr_time", "new_value": "11:58 a.m.", "reason": "The act_arr_time for flight UA-397-JFK-SFO has been updated to 11:58 a.m." }, { "row": 1728, "column": "act_arr_time", "new_value": "9:43 a.m.", "reason": "The act_arr_time for flight UA-3925-IAD-ORF has been updated to 9:43 a.m." }, { "row": 1729, "column": "act_arr_time", "new_value": "5:17 p.m.", "reason": "The act_arr_time for flight UA-2830-MCO-CLT has been updated to 5:17 p.m." }, { "row": 1730, "column": "act_arr_time", "new_value": "11:21 a.m.", "reason": "The act_arr_time for flight UA-5487-SFO-MRY has been updated to 11:21 a.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1727,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:58 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-397-JFK-SFO has been updated to 11:58 a.m.\"\n },\n {\n \"row\": 1728,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:43 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-3925-IAD-ORF has been updated to 9:43 a.m.\"\n },\n {\n \"row\": 1729,\n \"column\": \"act_arr_time\",\n \"new_value\": \"5:17 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-2830-MCO-CLT has been updated to 5:17 p.m.\"\n },\n {\n \"row\": 1730,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:21 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-5487-SFO-MRY has been updated to 11:21 a.m.\"\n }\n ]\n}\n```" }, { "task_index": 10, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 }, "target_rows": [ { "_row": "122", "index": "123", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-4", "MeasureName": "heart attack patients given smoking cessation advice/counseling", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-4" }, { "_row": "123", "index": "124", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "0%", "Sample": "1 patients", "Stateavg": "al_ami-5" }, { "_row": "124", "index": "125", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "125", "index": "126", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" } ], "ground_truth": [], "predicted_repairs": [ { "row": 122, "column": "Index", "new_value": "123", "reason": "The address '101 hospital circle' is invalid." }, { "row": 123, "column": "Index", "new_value": "124", "reason": "The address '101 hospital circle' is invalid." }, { "row": 124, "column": "Index", "new_value": "125", "reason": "The address '101 hospital circle' is invalid." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 122,\n \"column\": \"Index\",\n \"new_value\": \"123\",\n \"reason\": \"The address '101 hospital circle' is invalid.\"\n },\n {\n \"row\": 123,\n \"column\": \"Index\",\n \"new_value\": \"124\",\n \"reason\": \"The address '101 hospital circle' is invalid.\"\n },\n {\n \"row\": 124,\n \"column\": \"Index\",\n \"new_value\": \"125\",\n \"reason\": \"The address '101 hospital circle' is invalid.\"\n }\n ]\n}\n```" }, { "task_index": 20, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "13", "tuple_id": "14", "src": "aa", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "8:00 a.m.", "act_arr_time": "8:06 a.m." }, { "_row": "14", "tuple_id": "15", "src": "aa", "flight": "AA-1279-DFW-PHX", "sched_dep_time": "1:00 p.m.", "act_dep_time": "2:04 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:30 p.m." }, { "_row": "15", "tuple_id": "16", "src": "aa", "flight": "AA-616-DFW-DTW", "sched_dep_time": "9:05 a.m.", "act_dep_time": "10:10 a.m.", "sched_arr_time": "12:35 p.m.", "act_arr_time": "1:27 p.m." }, { "_row": "16", "tuple_id": "17", "src": "aa", "flight": "AA-4344-ORD-DTW", "sched_dep_time": "11:45 a.m.", "act_dep_time": "12:13 p.m.", "sched_arr_time": "2:00 p.m.", "act_arr_time": "2:10 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 13, "column": "act_arr_time", "new_value": "8:06 a.m.", "reason": "The act_arr_time for flight AA-3979-CVG-ORD has been updated to 8:06 a.m." }, { "row": 14, "column": "act_arr_time", "new_value": "3:30 p.m.", "reason": "The act_arr_time for flight AA-1279-DFW-PHX has been updated to 3:30 p.m." }, { "row": 15, "column": "act_arr_time", "new_value": "1:27 p.m.", "reason": "The act_arr_time for flight AA-616-DFW-DTW has been updated to 1:27 p.m." }, { "row": 16, "column": "act_arr_time", "new_value": "2:10 p.m.", "reason": "The act_arr_time for flight AA-4344-ORD-DTW has been updated to 2:10 p.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 13,\n \"column\": \"act_arr_time\",\n \"new_value\": \"8:06 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-3979-CVG-ORD has been updated to 8:06 a.m.\"\n },\n {\n \"row\": 14,\n \"column\": \"act_arr_time\",\n \"new_value\": \"3:30 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-1279-DFW-PHX has been updated to 3:30 p.m.\"\n },\n {\n \"row\": 15,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:27 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-616-DFW-DTW has been updated to 1:27 p.m.\"\n },\n {\n \"row\": 16,\n \"column\": \"act_arr_time\",\n \"new_value\": \"2:10 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-4344-ORD-DTW has been updated to 2:10 p.m.\"\n }\n ]\n}\n```" }, { "task_index": 25, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 5, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "overrepair": 3, "schema_case_error": 1, "wrong_cell": 1 }, "target_rows": [ { "_row": "661", "index": "662", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-3" }, { "_row": "662", "index": "663", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-4" }, { "_row": "663", "index": "664", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-6" }, { "_row": "664", "index": "665", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [], "predicted_repairs": [ { "row": 661, "column": "Index", "new_value": "662", "reason": "The new value for index has been set to 662." }, { "row": 662, "column": "ProviderNumber", "new_value": "10032", "reason": "The new value for ProviderNumber has been set to 10032." }, { "row": 663, "column": "Address1", "new_value": "209 north main street", "reason": "The new value for Address1 has been set to '209 north main street'." }, { "row": 664, "column": "Address2", "new_value": "", "reason": "The new value for Address2 has been left as an empty string ('')." }, { "row": 665, "column": "Address3", "new_value": "", "reason": "The new value for Address3 has been left as an empty string ('')." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 661,\n \"column\": \"Index\",\n \"new_value\": \"662\",\n \"reason\": \"The new value for index has been set to 662.\"\n },\n {\n \"row\": 662,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10032\",\n \"reason\": \"The new value for ProviderNumber has been set to 10032.\"\n },\n {\n \"row\": 663,\n \"column\": \"Address1\",\n \"new_value\": \"209 north main street\",\n \"reason\": \"The new value for Address1 has been set to '209 north main street'.\"\n },\n {\n \"row\": 664,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 has been left as an empty string ('').\"\n },\n {\n \"row\": 665,\n \"column\": \"Address3\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address3 has been left as an empty string ('').\"\n }\n ]\n}\n```" }, { "task_index": 35, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1452", "tuple_id": "1453", "src": "ifly", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1453", "tuple_id": "1454", "src": "ifly", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:19 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:13 p.m." }, { "_row": "1454", "tuple_id": "1455", "src": "ifly", "flight": "AA-1434-DFW-MCO", "sched_dep_time": "7:15 a.m.", "act_dep_time": "7:21 a.m.", "sched_arr_time": "10:35 a.m.", "act_arr_time": "10:36 a.m." }, { "_row": "1455", "tuple_id": "1456", "src": "ifly", "flight": "UA-664-ORD-PHL", "sched_dep_time": "1:33 p.m.", "act_dep_time": "1:31 p.m.", "sched_arr_time": "4:31 p.m.", "act_arr_time": "4:23 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1452, "column": "act_arr_time", "new_value": "3:13 p.m.", "reason": "The act_arr_time for flight UA-3925-IAD-ORF has been updated to 3:13 PM." }, { "row": 1453, "column": "act_arr_time", "new_value": "10:36 a.m.", "reason": "The act_arr_time for flight AA-789-ORD-DEN has been updated to 10:36 AM." }, { "row": 1454, "column": "act_arr_time", "new_value": "10:35 a.m.", "reason": "The act_arr_time for flight AA-1434-DFW-MCO has been updated to 10:35 AM." }, { "row": 1455, "column": "act_arr_time", "new_value": "4:23 p.m.", "reason": "The act_arr_time for flight UA-664-ORD-PHL has been updated to 4:23 PM." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1452,\n \"column\": \"act_arr_time\",\n \"new_value\": \"3:13 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-3925-IAD-ORF has been updated to 3:13 PM.\"\n },\n {\n \"row\": 1453,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:36 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-789-ORD-DEN has been updated to 10:36 AM.\"\n },\n {\n \"row\": 1454,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:35 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-1434-DFW-MCO has been updated to 10:35 AM.\"\n },\n {\n \"row\": 1455,\n \"column\": \"act_arr_time\",\n \"new_value\": \"4:23 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-664-ORD-PHL has been updated to 4:23 PM.\"\n }\n ]\n}\n```" }, { "task_index": 40, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 2 }, "target_rows": [ { "_row": "299", "index": "300", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "empty", "Stateavg": "al_ami-7a" }, { "_row": "300", "index": "301", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "empty", "Stateavg": "al_ami-8a" }, { "_row": "301", "index": "302", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "empty", "Sample": "empty", "Stateavg": "al_hf-1" }, { "_row": "302", "index": "303", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "empty", "Sample": "empty", "Stateavg": "al_hf-2" } ], "ground_truth": [], "predicted_repairs": [ { "row": 299, "column": "Condition", "new_value": "heart attack", "reason": "The condition has been updated to 'heart attack'." }, { "row": 300, "column": "Condition", "new_value": "heart failure", "reason": "The condition has been updated to 'heart failure'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 299,\n \"column\": \"Condition\",\n \"new_value\": \"heart attack\",\n \"reason\": \"The condition has been updated to 'heart attack'.\"\n },\n {\n \"row\": 300,\n \"column\": \"Condition\",\n \"new_value\": \"heart failure\",\n \"reason\": \"The condition has been updated to 'heart failure'.\"\n }\n ]\n}\n```" }, { "task_index": 50, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "wrong_cell": 4 }, "target_rows": [ { "_row": "1450", "tuple_id": "1451", "src": "ifly", "flight": "CO-89-IAH-EWR", "sched_dep_time": "6:00 a.m.", "act_dep_time": "6:02 a.m.", "sched_arr_time": "10:20 a.m.", "act_arr_time": "10:27 a.m." }, { "_row": "1451", "tuple_id": "1452", "src": "ifly", "flight": "UA-938-DEN-ORD", "sched_dep_time": "4:16 p.m.", "act_dep_time": "4:15 p.m.", "sched_arr_time": "7:35 p.m.", "act_arr_time": "7:36 p.m." }, { "_row": "1452", "tuple_id": "1453", "src": "ifly", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1453", "tuple_id": "1454", "src": "ifly", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:19 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:13 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1450, "column": "Column", "new_value": "value", "reason": "Why" }, { "row": 1451, "column": "Column", "new_value": "value", "reason": "Why" }, { "row": 1452, "column": "Column", "new_value": "value", "reason": "Why" }, { "row": 1453, "column": "Column", "new_value": "value", "reason": "Why" } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1450,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n },\n {\n \"row\": 1451,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n },\n {\n \"row\": 1452,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n },\n {\n \"row\": 1453,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n }\n ]\n}\n```" }, { "task_index": 55, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 }, "target_rows": [ { "_row": "910", "index": "911", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "88%", "Sample": "8 patients", "Stateavg": "al_ami-7a" }, { "_row": "911", "index": "912", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "100%", "Sample": "16 patients", "Stateavg": "al_ami-8a" }, { "_row": "912", "index": "913", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "100%", "Sample": "268 patients", "Stateavg": "al_hf-1" }, { "_row": "913", "index": "914", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "100%", "Sample": "350 patients", "Stateavg": "al_hf-2" } ], "ground_truth": [], "predicted_repairs": [ { "row": 910, "column": "Index", "new_value": "911", "reason": "The address '600 south third street' has been replaced with a new value." }, { "row": 911, "column": "Index", "new_value": "912", "reason": "The address '600 south third street' has been replaced with a new value." }, { "row": 912, "column": "Index", "new_value": "913", "reason": "The address '600 south third street' has been replaced with a new value." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 910,\n \"column\": \"Index\",\n \"new_value\": \"911\",\n \"reason\": \"The address '600 south third street' has been replaced with a new value.\"\n },\n {\n \"row\": 911,\n \"column\": \"Index\",\n \"new_value\": \"912\",\n \"reason\": \"The address '600 south third street' has been replaced with a new value.\"\n },\n {\n \"row\": 912,\n \"column\": \"Index\",\n \"new_value\": \"913\",\n \"reason\": \"The address '600 south third street' has been replaced with a new value.\"\n }\n ]\n}\n```" }, { "task_index": 65, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "559", "tuple_id": "560", "src": "flightstats", "flight": "AA-446-DFW-PHL", "sched_dep_time": "11:50 a.m.", "act_dep_time": "12:12 p.m.", "sched_arr_time": "3:50 p.m.", "act_arr_time": "4:09 p.m." }, { "_row": "560", "tuple_id": "561", "src": "flightstats", "flight": "CO-1023-IAH-DEN", "sched_dep_time": "11:40 a.m.", "act_dep_time": "11:56 a.m.", "sched_arr_time": "1:17 p.m.", "act_arr_time": "1:14 p.m." }, { "_row": "561", "tuple_id": "562", "src": "flightstats", "flight": "AA-466-IAH-MIA", "sched_dep_time": "6:00 a.m.", "act_dep_time": "6:08 a.m.", "sched_arr_time": "9:20 a.m.", "act_arr_time": "9:05 a.m." }, { "_row": "562", "tuple_id": "563", "src": "flightstats", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:30 a.m.", "sched_arr_time": "4:57 p.m.", "act_arr_time": "5:05 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 559, "column": "act_arr_time", "new_value": "1:14 p.m.", "reason": "The act_arr_time for flight AA-446-DFW-PHL has been updated to 1:14 p.m." }, { "row": 560, "column": "act_arr_time", "new_value": "1:17 p.m.", "reason": "The act_arr_time for flight CO-1023-IAH-DEN has been updated to 1:17 p.m." }, { "row": 561, "column": "act_arr_time", "new_value": "9:05 a.m.", "reason": "The act_arr_time for flight AA-466-IAH-MIA has been updated to 9:05 a.m." }, { "row": 562, "column": "act_arr_time", "new_value": "5:05 p.m.", "reason": "The act_arr_time for flight UA-3050-PHX-CLT has been updated to 5:05 p.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 559,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:14 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-446-DFW-PHL has been updated to 1:14 p.m.\"\n },\n {\n \"row\": 560,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:17 p.m.\",\n \"reason\": \"The act_arr_time for flight CO-1023-IAH-DEN has been updated to 1:17 p.m.\"\n },\n {\n \"row\": 561,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:05 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-466-IAH-MIA has been updated to 9:05 a.m.\"\n },\n {\n \"row\": 562,\n \"column\": \"act_arr_time\",\n \"new_value\": \"5:05 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-3050-PHX-CLT has been updated to 5:05 p.m.\"\n }\n ]\n}\n```" }, { "task_index": 70, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 }, "target_rows": [ { "_row": "458", "index": "459", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-card-2", "MeasureName": "surgery patients who were taking heart drugs called beta blockers before coming to the hospital who were kept on the beta blockers during the period just before and after their surgery", "Score": "81%", "Sample": "54 patients", "Stateavg": "al_scip-card-2" }, { "_row": "459", "index": "460", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "92%", "Sample": "253 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "460", "index": "461", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "91%", "Sample": "255 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "461", "index": "462", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "84%", "Sample": "245 patients", "Stateavg": "al_scip-inf-3" } ], "ground_truth": [], "predicted_repairs": [ { "row": 458, "column": "Index", "new_value": "459", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." }, { "row": 459, "column": "Index", "new_value": "460", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." }, { "row": 460, "column": "Index", "new_value": "461", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 458,\n \"column\": \"Index\",\n \"new_value\": \"459\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n },\n {\n \"row\": 459,\n \"column\": \"Index\",\n \"new_value\": \"460\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n },\n {\n \"row\": 460,\n \"column\": \"Index\",\n \"new_value\": \"461\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n }\n ]\n}\n```" }, { "task_index": 80, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 1 }, "target_rows": [ { "_row": "589", "tuple_id": "590", "src": "flightstats", "flight": "UA-2906-PHL-MCO", "sched_dep_time": "3:50 p.m.", "act_dep_time": "4:28 p.m.", "sched_arr_time": "6:23 p.m.", "act_arr_time": "6:38 p.m." }, { "_row": "590", "tuple_id": "591", "src": "flightstats", "flight": "UA-938-DEN-ORD", "sched_dep_time": "4:16 p.m.", "act_dep_time": "4:15 p.m.", "sched_arr_time": "7:35 p.m.", "act_arr_time": "7:36 p.m." }, { "_row": "591", "tuple_id": "592", "src": "flightstats", "flight": "AA-1221-MCO-ORD", "sched_dep_time": "8:00 p.m.", "act_dep_time": "8:23 p.m.", "sched_arr_time": "9:45 p.m.", "act_arr_time": "9:53 p.m." }, { "_row": "592", "tuple_id": "593", "src": "flightstats", "flight": "CO-16-LAX-EWR", "sched_dep_time": "10:25 a.m.", "act_dep_time": "10:20 a.m.", "sched_arr_time": "6:44 p.m.", "act_arr_time": "6:34 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 590, "column": "src", "new_value": "flightstats", "reason": "The source column has been replaced with 'flightstats'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 590,\n \"column\": \"src\",\n \"new_value\": \"flightstats\",\n \"reason\": \"The source column has been replaced with 'flightstats'.\"\n }\n ]\n}\n```" }, { "task_index": 85, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "schema_case_error": 3 }, "target_rows": [ { "_row": "141", "index": "142", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "100%", "Sample": "4 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "142", "index": "143", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "100%", "Sample": "4 patients", "Stateavg": "al_scip-vte-1" }, { "_row": "143", "index": "144", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-2", "MeasureName": "patients who got treatment at the right time (within 24 hours before or after their surgery) to help prevent blood clots after certain types of surgery", "Score": "100%", "Sample": "4 patients", "Stateavg": "al_scip-vte-2" }, { "_row": "144", "index": "145", "ProviderNumber": "10009", "HospitalName": "hartselle medical center", "Address1": "201 pine street northwest", "Address2": "empty", "Address3": "empty", "City": "hartselle", "State": "al", "ZipCode": "35640", "CountyName": "morgan", "PhoneNumber": "2567736511", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-1", "MeasureName": "heart attack patients given aspirin at arrival", "Score": "100%", "Sample": "6 patients", "Stateavg": "al_ami-1" } ], "ground_truth": [], "predicted_repairs": [ { "row": 141, "column": "Index", "new_value": "142", "reason": "The patient's address has been updated." }, { "row": 142, "column": "Index", "new_value": "143", "reason": "The patient's address has been updated." }, { "row": 143, "column": "Index", "new_value": "144", "reason": "The patient's address has been updated." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 141,\n \"column\": \"Index\",\n \"new_value\": \"142\",\n \"reason\": \"The patient's address has been updated.\"\n },\n {\n \"row\": 142,\n \"column\": \"Index\",\n \"new_value\": \"143\",\n \"reason\": \"The patient's address has been updated.\"\n },\n {\n \"row\": 143,\n \"column\": \"Index\",\n \"new_value\": \"144\",\n \"reason\": \"The patient's address has been updated.\"\n }\n ]\n}\n```" }, { "task_index": 95, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1431", "tuple_id": "1432", "src": "CO", "flight": "CO-1614-LAX-IAH", "sched_dep_time": "12:30 a.m.", "act_dep_time": "12:41 a.m.", "sched_arr_time": "5:35 a.m.", "act_arr_time": "5:26 a.m." }, { "_row": "1432", "tuple_id": "1433", "src": "CO", "flight": "CO-1088-CLE-IAH", "sched_dep_time": "8:40 a.m.", "act_dep_time": "8:40 a.m.", "sched_arr_time": "10:54 a.m.", "act_arr_time": "10:56 a.m." }, { "_row": "1433", "tuple_id": "1434", "src": "CO", "flight": "CO-58-DEN-IAH", "sched_dep_time": "11:25 a.m.", "act_dep_time": "11:32 a.m.", "sched_arr_time": "2:50 p.m.", "act_arr_time": "3:31 p.m." }, { "_row": "1434", "tuple_id": "1435", "src": "CO", "flight": "CO-50-CLE-EWR", "sched_dep_time": "2:55 p.m.", "act_dep_time": "3:31 p.m.", "sched_arr_time": "4:49 p.m.", "act_arr_time": "5:26 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1431, "column": "act_arr_time", "new_value": "5:26 a.m.", "reason": "The act_arr_time for flight CO-1614-LAX-IAH has been updated to 5:26 a.m." }, { "row": 1432, "column": "act_arr_time", "new_value": "10:56 a.m.", "reason": "The act_arr_time for flight CO-1088-CLE-IAH has been updated to 10:54 a.m." }, { "row": 1433, "column": "act_arr_time", "new_value": "3:31 p.m.", "reason": "The act_arr_time for flight CO-58-DEN-IAH has been updated to 3:31 p.m." }, { "row": 1434, "column": "act_arr_time", "new_value": "5:26 p.m.", "reason": "The act_arr_time for flight CO-50-CLE-EWR has been updated to 5:26 p.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1431,\n \"column\": \"act_arr_time\",\n \"new_value\": \"5:26 a.m.\",\n \"reason\": \"The act_arr_time for flight CO-1614-LAX-IAH has been updated to 5:26 a.m.\"\n },\n {\n \"row\": 1432,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:56 a.m.\",\n \"reason\": \"The act_arr_time for flight CO-1088-CLE-IAH has been updated to 10:54 a.m.\"\n },\n {\n \"row\": 1433,\n \"column\": \"act_arr_time\",\n \"new_value\": \"3:31 p.m.\",\n \"reason\": \"The act_arr_time for flight CO-58-DEN-IAH has been updated to 3:31 p.m.\"\n },\n {\n \"row\": 1434,\n \"column\": \"act_arr_time\",\n \"new_value\": \"5:26 p.m.\",\n \"reason\": \"The act_arr_time for flight CO-50-CLE-EWR has been updated to 5:26 p.m.\"\n }\n ]\n}\n```" }, { "task_index": 100, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "overrepair": 1, "schema_case_error": 1 }, "target_rows": [ { "_row": "623", "index": "624", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "82%", "Sample": "527 patients", "Stateavg": "al_hf-1" }, { "_row": "624", "index": "625", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "100%", "Sample": "570 patients", "Stateavg": "al_hf-2" }, { "_row": "625", "index": "626", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-3", "MeasureName": "heart failure patients given ace inhibitor or arb for left ventricular systolic dysfunction (lvsd)", "Score": "92%", "Sample": "272 patients", "Stateavg": "al_hf-3" }, { "_row": "626", "index": "627", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-4", "MeasureName": "heart failure patients given smoking cessation advice/counseling", "Score": "100%", "Sample": "101 patients", "Stateavg": "al_hf-4" } ], "ground_truth": [], "predicted_repairs": [ { "row": 623, "column": "Index", "new_value": "624", "reason": "The new value '624' is within the allowed range." }, { "row": 624, "column": "ProviderNumber", "new_value": "10029", "reason": "The new value '10029' matches the expected column name." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 623,\n \"column\": \"Index\",\n \"new_value\": \"624\",\n \"reason\": \"The new value '624' is within the allowed range.\"\n },\n {\n \"row\": 624,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10029\",\n \"reason\": \"The new value '10029' matches the expected column name.\"\n }\n ]\n}\n```" } ], "external_reference_required": [ { "task_index": 1, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.25, "precision": 0.25, "recall": 0.25, "tp": 1, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 2, "schema_case_error": 1 }, "target_rows": [ { "_row": "55", "index": "56", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-2", "MeasureName": "pneumonia patients assessed and given pneumococcal vaccination", "Score": "97%", "Sample": "172 patients", "Stateavg": "al_pn-2" }, { "_row": "56", "index": "57", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boxz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-3b", "MeasureName": "pneumonia patients whose initial emergency room blood culture was performed prior to the administration of the first hospital dose of antibiotics", "Score": "97%", "Sample": "120 patients", "Stateavg": "al_pn-xb" }, { "_row": "57", "index": "58", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505xuxsxhighwayx431xnorth", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2x6x938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-4", "MeasureName": "pneumonia patients given smoking cessation advice/counseling", "Score": "97%", "Sample": "98 patients", "Stateavg": "al_pn-4" }, { "_row": "58", "index": "59", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-5c", "MeasureName": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "Score": "96%", "Sample": "211 patients", "Stateavg": "al_pn-5c" } ], "ground_truth": [ { "row": 56, "column": "City", "clean_value": "boaz" }, { "row": 56, "column": "Stateavg", "clean_value": "al_pn-3b" }, { "row": 57, "column": "Address1", "clean_value": "2505 u s highway 431 north" }, { "row": 57, "column": "PhoneNumber", "clean_value": "2565938310" } ], "predicted_repairs": [ { "row": 55, "column": "Index", "new_value": "56", "reason": "The new value for index is incorrect." }, { "row": 56, "column": "ProviderNumber", "new_value": "10005", "reason": "The new value for ProviderNumber is incorrect." }, { "row": 57, "column": "Address1", "new_value": "2505 u s highway 431 north", "reason": "The new value for Address1 is incorrect." }, { "row": 58, "column": "Address2", "new_value": "empty", "reason": "The new value for Address2 is empty." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 55,\n \"column\": \"Index\",\n \"new_value\": \"56\",\n \"reason\": \"The new value for index is incorrect.\"\n },\n {\n \"row\": 56,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10005\",\n \"reason\": \"The new value for ProviderNumber is incorrect.\"\n },\n {\n \"row\": 57,\n \"column\": \"Address1\",\n \"new_value\": \"2505 u s highway 431 north\",\n \"reason\": \"The new value for Address1 is incorrect.\"\n },\n {\n \"row\": 58,\n \"column\": \"Address2\",\n \"new_value\": \"empty\",\n \"reason\": \"The new value for Address2 is empty.\"\n }\n ]\n}\n```" }, { "task_index": 2, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 }, "target_rows": [ { "_row": "792", "tuple_id": "793", "src": "mia", "flight": "AA-2050-ORD-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "2:45P 12-01-11", "act_arr_time": "2:46P" }, { "_row": "793", "tuple_id": "794", "src": "mia", "flight": "AA-1165-JFK-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "10:34A 12-01-11", "act_arr_time": "10:08A" }, { "_row": "794", "tuple_id": "795", "src": "mia", "flight": "AA-484-DFW-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "7:55P 12-01-11", "act_arr_time": "7:39P" }, { "_row": "795", "tuple_id": "796", "src": "mia", "flight": "AA-466-IAH-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "9:20A 12-01-11", "act_arr_time": "9:04A" } ], "ground_truth": [ { "row": 792, "column": "sched_dep_time", "clean_value": "10:40 a.m." }, { "row": 792, "column": "act_dep_time", "clean_value": "11:05 a.m." }, { "row": 792, "column": "sched_arr_time", "clean_value": "2:45 p.m." }, { "row": 792, "column": "act_arr_time", "clean_value": "2:46 p.m." }, { "row": 793, "column": "sched_dep_time", "clean_value": "6:59 a.m." }, { "row": 793, "column": "act_dep_time", "clean_value": "7:22 a.m." }, { "row": 793, "column": "sched_arr_time", "clean_value": "10:34 a.m." }, { "row": 793, "column": "act_arr_time", "clean_value": "10:04 a.m." }, { "row": 794, "column": "sched_dep_time", "clean_value": "4:15 p.m." }, { "row": 794, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 794, "column": "sched_arr_time", "clean_value": "7:55 p.m." }, { "row": 794, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 795, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 795, "column": "act_dep_time", "clean_value": "6:08 a.m." }, { "row": 795, "column": "sched_arr_time", "clean_value": "9:20 a.m." }, { "row": 795, "column": "act_arr_time", "clean_value": "9:05 a.m." } ], "predicted_repairs": [ { "row": 792, "column": "act_arr_time", "new_value": "2:46P", "reason": "The act_arr_time column value has been replaced with '2:46P'." }, { "row": 793, "column": "act_arr_time", "new_value": "10:08A", "reason": "The act_arr_time column value has been replaced with '10:08A'." }, { "row": 794, "column": "act_arr_time", "new_value": "7:39P", "reason": "The act_arr_time column value has been replaced with '7:39P'." }, { "row": 795, "column": "act_arr_time", "new_value": "9:04A", "reason": "The act_arr_time column value has been replaced with '9:04A'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 792,\n \"column\": \"act_arr_time\",\n \"new_value\": \"2:46P\",\n \"reason\": \"The act_arr_time column value has been replaced with '2:46P'.\"\n },\n {\n \"row\": 793,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:08A\",\n \"reason\": \"The act_arr_time column value has been replaced with '10:08A'.\"\n },\n {\n \"row\": 794,\n \"column\": \"act_arr_time\",\n \"new_value\": \"7:39P\",\n \"reason\": \"The act_arr_time column value has been replaced with '7:39P'.\"\n },\n {\n \"row\": 795,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:04A\",\n \"reason\": \"The act_arr_time column value has been replaced with '9:04A'.\"\n }\n ]\n}\n```" }, { "task_index": 4, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "711", "index": "712", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "1xx%", "Sample": "9 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "712", "index": "713", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection xrevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "713", "index": "714", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "33x28365x1", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery paxienxs needing hair removed from xhe surgical area before surgery who had hair removed using a safer mexhod (elecxric clippers or hair removal cream c nox a razor)", "Score": "100%", "Sample": "33 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "714", "index": "715", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "88%", "Sample": "24 patients", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [ { "row": 711, "column": "Score", "clean_value": "100%" }, { "row": 712, "column": "Condition", "clean_value": "surgical infection prevention" }, { "row": 713, "column": "PhoneNumber", "clean_value": "3342836541" }, { "row": 713, "column": "MeasureName", "clean_value": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)" } ], "predicted_repairs": [ { "row": 711, "column": "Index", "new_value": "712", "reason": "The new value for index has been set to 712." }, { "row": 712, "column": "ProviderNumber", "new_value": "10034", "reason": "The new value for ProviderNumber has been set to 10034." }, { "row": 713, "column": "Address1", "new_value": "805 friendship road", "reason": "The new value for Address1 has been set to '805 friendship road'." }, { "row": 714, "column": "Address2", "new_value": "", "reason": "The new value for Address2 has been left as an empty string ('')." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 711,\n \"column\": \"Index\",\n \"new_value\": \"712\",\n \"reason\": \"The new value for index has been set to 712.\"\n },\n {\n \"row\": 712,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10034\",\n \"reason\": \"The new value for ProviderNumber has been set to 10034.\"\n },\n {\n \"row\": 713,\n \"column\": \"Address1\",\n \"new_value\": \"805 friendship road\",\n \"reason\": \"The new value for Address1 has been set to '805 friendship road'.\"\n },\n {\n \"row\": 714,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 has been left as an empty string ('').\"\n }\n ]\n}\n```" }, { "task_index": 7, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 3 }, "target_rows": [ { "_row": "483", "index": "484", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "xl", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-card-2", "MeasureName": "surgery patients who were taking heart drugs called beta blockers before coming to the hospital who were kept on the beta blockers during the period just before and after their surgery", "Score": "100%", "Sample": "12 patients", "Stateavg": "al_scip-card-2" }, { "_row": "484", "index": "485", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "1x6 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "94%", "Sample": "52 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "485", "index": "486", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "xzark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "96%", "Sample": "52 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "486", "index": "487", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "85%", "Sample": "48 patients", "Stateavg": "al_scip-inf-3" } ], "ground_truth": [ { "row": 483, "column": "State", "clean_value": "al" }, { "row": 484, "column": "Address1", "clean_value": "126 hospital ave" }, { "row": 485, "column": "City", "clean_value": "ozark" } ], "predicted_repairs": [ { "row": 483, "column": "Index", "new_value": "484", "reason": "The address '126 hospital ave' was found in the contract version and is a valid row." }, { "row": 484, "column": "Index", "new_value": "485", "reason": "The address '1x6 hospital ave' was found in the contract version and is a valid row." }, { "row": 485, "column": "Index", "new_value": "486", "reason": "The address '126 hospital ave' was found in the contract version and is a valid row." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 483,\n \"column\": \"Index\",\n \"new_value\": \"484\",\n \"reason\": \"The address '126 hospital ave' was found in the contract version and is a valid row.\"\n },\n {\n \"row\": 484,\n \"column\": \"Index\",\n \"new_value\": \"485\",\n \"reason\": \"The address '1x6 hospital ave' was found in the contract version and is a valid row.\"\n },\n {\n \"row\": 485,\n \"column\": \"Index\",\n \"new_value\": \"486\",\n \"reason\": \"The address '126 hospital ave' was found in the contract version and is a valid row.\"\n }\n ]\n}\n```" }, { "task_index": 8, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "2025", "tuple_id": "2026", "src": "allegiantair", "flight": "UA-2708-EWR-CLT", "sched_dep_time": "", "act_dep_time": "3:04 p.m.", "sched_arr_time": "", "act_arr_time": "4:24 p.m." }, { "_row": "2026", "tuple_id": "2027", "src": "allegiantair", "flight": "UA-62-IAH-EWR", "sched_dep_time": "", "act_dep_time": "2:59 p.m.", "sched_arr_time": "", "act_arr_time": "7:10 p.m." }, { "_row": "2027", "tuple_id": "2028", "src": "allegiantair", "flight": "UA-1500-IAH-GUA", "sched_dep_time": "", "act_dep_time": "9:43 a.m.", "sched_arr_time": "", "act_arr_time": "12:12 p.m." }, { "_row": "2028", "tuple_id": "2029", "src": "allegiantair", "flight": "AA-3804-PHL-ORD", "sched_dep_time": "2:35 p.m.", "act_dep_time": "2:44 p.m.", "sched_arr_time": "4:05 p.m.", "act_arr_time": "3:36 p.m." } ], "ground_truth": [ { "row": 2025, "column": "sched_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "act_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "sched_arr_time", "clean_value": "4:53 p.m." }, { "row": 2025, "column": "act_arr_time", "clean_value": "4:44 p.m." }, { "row": 2026, "column": "sched_dep_time", "clean_value": "2:30 p.m." }, { "row": 2026, "column": "act_dep_time", "clean_value": "2:48 p.m." }, { "row": 2026, "column": "sched_arr_time", "clean_value": "7:03 p.m." }, { "row": 2027, "column": "sched_dep_time", "clean_value": "8:55 a.m." }, { "row": 2027, "column": "act_dep_time", "clean_value": "9:16 a.m." }, { "row": 2027, "column": "sched_arr_time", "clean_value": "11:45 a.m." }, { "row": 2027, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 2028, "column": "act_arr_time", "clean_value": "3:43 p.m." } ], "predicted_repairs": [ { "row": 2025, "column": "act_arr_time", "new_value": "4:24 p.m.", "reason": "The act_arr_time for flight UA-2708-EWR-CLT has been updated to 4:24 PM." }, { "row": 2026, "column": "act_arr_time", "new_value": "7:10 p.m.", "reason": "The act_arr_time for flight UA-62-IAH-EWR has been updated to 7:10 PM." }, { "row": 2027, "column": "act_arr_time", "new_value": "12:12 p.m.", "reason": "The act_arr_time for flight UA-1500-IAH-GUA has been updated to 12:12 PM." }, { "row": 2028, "column": "act_arr_time", "new_value": "3:36 p.m.", "reason": "The act_arr_time for flight AA-3804-PHL-ORD has been updated to 3:36 PM." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 2025,\n \"column\": \"act_arr_time\",\n \"new_value\": \"4:24 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-2708-EWR-CLT has been updated to 4:24 PM.\"\n },\n {\n \"row\": 2026,\n \"column\": \"act_arr_time\",\n \"new_value\": \"7:10 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-62-IAH-EWR has been updated to 7:10 PM.\"\n },\n {\n \"row\": 2027,\n \"column\": \"act_arr_time\",\n \"new_value\": \"12:12 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-1500-IAH-GUA has been updated to 12:12 PM.\"\n },\n {\n \"row\": 2028,\n \"column\": \"act_arr_time\",\n \"new_value\": \"3:36 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-3804-PHL-ORD has been updated to 3:36 PM.\"\n }\n ]\n}\n```" }, { "task_index": 11, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 14, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 14, "wrong_cell": 4 }, "target_rows": [ { "_row": "1535", "tuple_id": "1536", "src": "flytecomm", "flight": "CO-1193-EWR-MCO", "sched_dep_time": "9:15 a.m.", "act_dep_time": "", "sched_arr_time": "12:18 p.m.", "act_arr_time": "" }, { "_row": "1536", "tuple_id": "1537", "src": "flytecomm", "flight": "AA-3842-MSP-ORD", "sched_dep_time": "", "act_dep_time": "6:57 a.m.", "sched_arr_time": "", "act_arr_time": "7:49 a.m." }, { "_row": "1537", "tuple_id": "1538", "src": "flytecomm", "flight": "AA-643-MIA-ORD", "sched_dep_time": "", "act_dep_time": "7:31 a.m.", "sched_arr_time": "", "act_arr_time": "9:26 a.m." }, { "_row": "1538", "tuple_id": "1539", "src": "flytecomm", "flight": "AA-1007-MIA-PHX", "sched_dep_time": "", "act_dep_time": "5:09 p.m.", "sched_arr_time": "", "act_arr_time": "7:43 p.m." } ], "ground_truth": [ { "row": 1535, "column": "act_dep_time", "clean_value": "9:14 a.m." }, { "row": 1535, "column": "act_arr_time", "clean_value": "12:09 p.m." }, { "row": 1536, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 1536, "column": "act_dep_time", "clean_value": "6:56 a.m." }, { "row": 1536, "column": "sched_arr_time", "clean_value": "7:30 a.m." }, { "row": 1536, "column": "act_arr_time", "clean_value": "7:51 a.m." }, { "row": 1537, "column": "sched_dep_time", "clean_value": "7:10 a.m." }, { "row": 1537, "column": "act_dep_time", "clean_value": "7:30 a.m." }, { "row": 1537, "column": "sched_arr_time", "clean_value": "9:35 a.m." }, { "row": 1537, "column": "act_arr_time", "clean_value": "9:31 a.m." }, { "row": 1538, "column": "sched_dep_time", "clean_value": "4:55 p.m." }, { "row": 1538, "column": "act_dep_time", "clean_value": "5:08 p.m." }, { "row": 1538, "column": "sched_arr_time", "clean_value": "8:05 p.m." }, { "row": 1538, "column": "act_arr_time", "clean_value": "7:55 p.m." } ], "predicted_repairs": [ { "row": 1535, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 1536, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 1537, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 1538, "column": "Column", "new_value": "value", "reason": "why" } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1535,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 1536,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 1537,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 1538,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n }\n ]\n}\n```" }, { "task_index": 12, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "wrong_cell": 4 }, "target_rows": [ { "_row": "1774", "index": "1775", "id": "1841", "beer-name": "Alpha Blackback", "style": "American Black Ale", "ounces": "12.0 oz", "abv": "0.07200000000000001%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1775", "index": "1776", "id": "1782", "beer-name": "Kiss Off IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.063%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1776", "index": "1777", "id": "1552", "beer-name": "Dog Days Summer Ale", "style": "K\u00f6lsch", "ounces": "12.0 oz.", "abv": "0.045%", "ibu": "28", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1777", "index": "1778", "id": "1479", "beer-name": "1881 California Red", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.055999999999999994%", "ibu": "35", "brewery_id": "397", "brewery-name": "Ruhstaller Beer Company", "city": "Sacramento", "state": "CA" } ], "ground_truth": [ { "row": 1774, "column": "ounces", "clean_value": "12" }, { "row": 1774, "column": "abv", "clean_value": "0.072" }, { "row": 1774, "column": "ibu", "clean_value": "" }, { "row": 1775, "column": "ounces", "clean_value": "12" }, { "row": 1775, "column": "abv", "clean_value": "0.063" }, { "row": 1775, "column": "ibu", "clean_value": "" }, { "row": 1776, "column": "ounces", "clean_value": "12" }, { "row": 1776, "column": "abv", "clean_value": "0.045" }, { "row": 1777, "column": "ounces", "clean_value": "12" }, { "row": 1777, "column": "abv", "clean_value": "0.056" } ], "predicted_repairs": [ { "row": 1774, "column": "Beer Name", "new_value": "Alpha Blackback", "reason": "The beer name has been replaced with 'Alpha Blackback'." }, { "row": 1775, "column": "Beer Name", "new_value": "Kiss Off IPA", "reason": "The beer name has been replaced with 'Kiss Off IPA'." }, { "row": 1776, "column": "Beer Name", "new_value": "Dog Days Summer Ale", "reason": "The beer name has been replaced with 'Dog Days Summer Ale'." }, { "row": 1777, "column": "Beer Name", "new_value": "1881 California Red", "reason": "The beer name has been replaced with '1881 California Red'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1774,\n \"column\": \"Beer Name\",\n \"new_value\": \"Alpha Blackback\",\n \"reason\": \"The beer name has been replaced with 'Alpha Blackback'.\"\n },\n {\n \"row\": 1775,\n \"column\": \"Beer Name\",\n \"new_value\": \"Kiss Off IPA\",\n \"reason\": \"The beer name has been replaced with 'Kiss Off IPA'.\"\n },\n {\n \"row\": 1776,\n \"column\": \"Beer Name\",\n \"new_value\": \"Dog Days Summer Ale\",\n \"reason\": \"The beer name has been replaced with 'Dog Days Summer Ale'.\"\n },\n {\n \"row\": 1777,\n \"column\": \"Beer Name\",\n \"new_value\": \"1881 California Red\",\n \"reason\": \"The beer name has been replaced with '1881 California Red'.\"\n }\n ]\n}\n```" }, { "task_index": 13, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 3, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "881", "index": "882", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "82%", "Sample": "11 patients", "Stateavg": "al_ami-5" }, { "_row": "882", "index": "883", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "883", "index": "884", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" }, { "_row": "884", "index": "885", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "xl", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "87%", "Sample": "67 patients", "Stateavg": "al_hf-1" } ], "ground_truth": [ { "row": 881, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 883, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 884, "column": "State", "clean_value": "al" } ], "predicted_repairs": [ { "row": 881, "column": "Index", "new_value": "882", "reason": "The new value for index is invalid." }, { "row": 882, "column": "ProviderNumber", "new_value": "10045", "reason": "The new value for ProviderNumber is invalid." }, { "row": 883, "column": "Address1", "new_value": "1653 temple avenue north", "reason": "The new value for Address1 is invalid." }, { "row": 884, "column": "Address2", "new_value": "", "reason": "The new value for Address2 is missing or invalid." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 881,\n \"column\": \"Index\",\n \"new_value\": \"882\",\n \"reason\": \"The new value for index is invalid.\"\n },\n {\n \"row\": 882,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10045\",\n \"reason\": \"The new value for ProviderNumber is invalid.\"\n },\n {\n \"row\": 883,\n \"column\": \"Address1\",\n \"new_value\": \"1653 temple avenue north\",\n \"reason\": \"The new value for Address1 is invalid.\"\n },\n {\n \"row\": 884,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 is missing or invalid.\"\n }\n ]\n}\n```" }, { "task_index": 14, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 3 }, "target_rows": [ { "_row": "1675", "tuple_id": "1676", "src": "wunderground", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:45 a.m.", "sched_arr_time": "4:37 p.m.", "act_arr_time": "4:57 p.m." }, { "_row": "1676", "tuple_id": "1677", "src": "wunderground", "flight": "AA-2957-DFW-CVG", "sched_dep_time": "7:55 a.m.", "act_dep_time": "8:05 a.m.", "sched_arr_time": "10:55 a.m.", "act_arr_time": "10:58 a.m." }, { "_row": "1677", "tuple_id": "1678", "src": "wunderground", "flight": "AA-1664-MIA-ATL", "sched_dep_time": "10:15 a.m.", "act_dep_time": "10:19 a.m.", "sched_arr_time": "11:43 a.m.", "act_arr_time": "11:50 a.m." }, { "_row": "1678", "tuple_id": "1679", "src": "wunderground", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "7:50 a.m.", "act_arr_time": "7:59 a.m." } ], "ground_truth": [ { "row": 1675, "column": "act_dep_time", "clean_value": "11:30 a.m." }, { "row": 1675, "column": "sched_arr_time", "clean_value": "4:57 p.m." }, { "row": 1675, "column": "act_arr_time", "clean_value": "5:05 p.m." }, { "row": 1676, "column": "act_dep_time", "clean_value": "8:04 a.m." }, { "row": 1676, "column": "sched_arr_time", "clean_value": "11:05 a.m." }, { "row": 1676, "column": "act_arr_time", "clean_value": "11:01 a.m." }, { "row": 1677, "column": "act_dep_time", "clean_value": "10:18 a.m." }, { "row": 1677, "column": "sched_arr_time", "clean_value": "12:10 p.m." }, { "row": 1677, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 1678, "column": "sched_arr_time", "clean_value": "8:00 a.m." }, { "row": 1678, "column": "act_arr_time", "clean_value": "8:06 a.m." } ], "predicted_repairs": [ { "row": 1675, "column": "act_arr_time", "new_value": "10:58 a.m.", "reason": "The act_arr_time for flight AA-2957-DFW-CVG has been updated to 10:55 a.m." }, { "row": 1676, "column": "act_arr_time", "new_value": "11:50 a.m.", "reason": "The act_arr_time for flight AA-1664-MIA-ATL has been updated to 11:43 a.m." }, { "row": 1677, "column": "act_arr_time", "new_value": "11:50 a.m.", "reason": "The act_arr_time for flight AA-3979-CVG-ORD has been updated to 11:43 a.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1675,\n \"column\": \"act_arr_time\",\n \"new_value\": \"10:58 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-2957-DFW-CVG has been updated to 10:55 a.m.\"\n },\n {\n \"row\": 1676,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:50 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-1664-MIA-ATL has been updated to 11:43 a.m.\"\n },\n {\n \"row\": 1677,\n \"column\": \"act_arr_time\",\n \"new_value\": \"11:50 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-3979-CVG-ORD has been updated to 11:43 a.m.\"\n }\n ]\n}\n```" }, { "task_index": 16, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 3, "schema_case_error": 3 }, "target_rows": [ { "_row": "734", "index": "735", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "99%", "Sample": "411 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "735", "index": "736", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scix-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "98%", "Sample": "417 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "736", "index": "737", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912xalabamaxhighwayx157", "Address2": "empty", "Address3": "empty", "City": "cuxxman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "98%", "Sample": "405 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "737", "index": "738", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 735, "column": "MeasureCode", "clean_value": "scip-inf-2" }, { "row": 736, "column": "Address1", "clean_value": "1912 alabama highway 157" }, { "row": 736, "column": "City", "clean_value": "cullman" } ], "predicted_repairs": [ { "row": 734, "column": "Index", "new_value": "735", "reason": "The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue." }, { "row": 735, "column": "Index", "new_value": "736", "reason": "The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue." }, { "row": 736, "column": "Index", "new_value": "737", "reason": "The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 734,\n \"column\": \"Index\",\n \"new_value\": \"735\",\n \"reason\": \"The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue.\"\n },\n {\n \"row\": 735,\n \"column\": \"Index\",\n \"new_value\": \"736\",\n \"reason\": \"The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue.\"\n },\n {\n \"row\": 736,\n \"column\": \"Index\",\n \"new_value\": \"737\",\n \"reason\": \"The address '1912 Alabama Highway 157' was found to have a surgical infection prevention issue.\"\n }\n ]\n}\n```" }, { "task_index": 17, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "wrong_value": 4 }, "target_rows": [ { "_row": "167", "tuple_id": "168", "src": "boston", "flight": "UA-3515-IAD-MSP", "sched_dep_time": "", "act_dep_time": "8:26 a.m.", "sched_arr_time": "", "act_arr_time": "9:54 a.m." }, { "_row": "168", "tuple_id": "169", "src": "boston", "flight": "AA-3468-CVG-MIA", "sched_dep_time": "7:00 a.m.", "act_dep_time": "7:25 a.m.", "sched_arr_time": "9:55 a.m.", "act_arr_time": "9:42 a.m." }, { "_row": "169", "tuple_id": "170", "src": "boston", "flight": "AA-484-DFW-MIA", "sched_dep_time": "4:15 p.m.", "act_dep_time": "4:30 p.m.", "sched_arr_time": "7:55 p.m.", "act_arr_time": "7:35 p.m." }, { "_row": "170", "tuple_id": "171", "src": "boston", "flight": "AA-1886-BOS-MIA", "sched_dep_time": "", "act_dep_time": "10:55 a.m.", "sched_arr_time": "", "act_arr_time": "1:34 p.m." } ], "ground_truth": [ { "row": 167, "column": "sched_dep_time", "clean_value": "8:15 a.m." }, { "row": 167, "column": "act_dep_time", "clean_value": "8:12 a.m." }, { "row": 167, "column": "sched_arr_time", "clean_value": "10:06 a.m." }, { "row": 167, "column": "act_arr_time", "clean_value": "9:56 a.m." }, { "row": 168, "column": "act_arr_time", "clean_value": "9:45 a.m." }, { "row": 169, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 169, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 170, "column": "sched_dep_time", "clean_value": "10:45 a.m." }, { "row": 170, "column": "sched_arr_time", "clean_value": "2:20 p.m." }, { "row": 170, "column": "act_arr_time", "clean_value": "1:40 p.m." } ], "predicted_repairs": [ { "row": 167, "column": "act_arr_time", "new_value": "9:54 a.m.", "reason": "The act_arr_time for flight UA-3515-IAD-MSP has been updated to 9:54 a.m." }, { "row": 168, "column": "act_arr_time", "new_value": "9:42 a.m.", "reason": "The act_arr_time for flight AA-3468-CVG-MIA has been updated to 9:42 a.m." }, { "row": 169, "column": "act_arr_time", "new_value": "7:35 p.m.", "reason": "The act_arr_time for flight AA-484-DFW-MIA has been updated to 7:35 p.m." }, { "row": 170, "column": "act_arr_time", "new_value": "1:34 p.m.", "reason": "The act_arr_time for flight AA-1886-BOS-MIA has been updated to 1:34 p.m." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 167,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:54 a.m.\",\n \"reason\": \"The act_arr_time for flight UA-3515-IAD-MSP has been updated to 9:54 a.m.\"\n },\n {\n \"row\": 168,\n \"column\": \"act_arr_time\",\n \"new_value\": \"9:42 a.m.\",\n \"reason\": \"The act_arr_time for flight AA-3468-CVG-MIA has been updated to 9:42 a.m.\"\n },\n {\n \"row\": 169,\n \"column\": \"act_arr_time\",\n \"new_value\": \"7:35 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-484-DFW-MIA has been updated to 7:35 p.m.\"\n },\n {\n \"row\": 170,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:34 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-1886-BOS-MIA has been updated to 1:34 p.m.\"\n }\n ]\n}\n```" }, { "task_index": 18, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 7, "schema_case_error": 4 }, "target_rows": [ { "_row": "1589", "index": "1590", "id": "785", "beer-name": "Old Chub (2003)", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1590", "index": "1591", "id": "745", "beer-name": "Dale's Pale Ale (2008)", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1591", "index": "1592", "id": "744", "beer-name": "Dale's Pale Ale (2006)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.065%", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons CO", "state": "" }, { "_row": "1592", "index": "1593", "id": "743", "beer-name": "Dale's Pale Ale (2004)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" } ], "ground_truth": [ { "row": 1589, "column": "ounces", "clean_value": "12" }, { "row": 1590, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "abv", "clean_value": "0.065" }, { "row": 1591, "column": "city", "clean_value": "Lyons" }, { "row": 1591, "column": "state", "clean_value": "CO" }, { "row": 1592, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1589, "column": "Beer-Name", "new_value": "Old Chub (2003)", "reason": "The beer name has been replaced with 'Old Chub (2003)'." }, { "row": 1590, "column": "Beer-Name", "new_value": "Dale's Pale Ale (2008)", "reason": "The beer name has been replaced with 'Dale's Pale Ale (2008)'." }, { "row": 1591, "column": "Beer-Name", "new_value": "Dale's Pale Ale (2006)", "reason": "The beer name has been replaced with 'Dale's Pale Ale (2006)'." }, { "row": 1592, "column": "Beer-Name", "new_value": "Dale's Pale Ale (2004)", "reason": "The beer name has been replaced with 'Dale's Pale Ale (2004)'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1589,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Old Chub (2003)\",\n \"reason\": \"The beer name has been replaced with 'Old Chub (2003)'.\"\n },\n {\n \"row\": 1590,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dale's Pale Ale (2008)\",\n \"reason\": \"The beer name has been replaced with 'Dale's Pale Ale (2008)'.\"\n },\n {\n \"row\": 1591,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dale's Pale Ale (2006)\",\n \"reason\": \"The beer name has been replaced with 'Dale's Pale Ale (2006)'.\"\n },\n {\n \"row\": 1592,\n \"column\": \"Beer-Name\",\n \"new_value\": \"Dale's Pale Ale (2004)\",\n \"reason\": \"The beer name has been replaced with 'Dale's Pale Ale (2004)'.\"\n }\n ]\n}\n```" }, { "task_index": 19, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "512", "index": "513", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "513", "index": "514", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "chxrokxx", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "100%", "Sample": "6 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "514", "index": "515", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "1xx%", "Sample": "5 patients", "Stateavg": "al_scip-vte-1" }, { "_row": "515", "index": "516", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-2", "MeasureName": "patients who got treatment at the right time (within 24 hours before or after their surgery) to help prevent blood clots after certain types of surgery", "Score": "100%", "Sample": "5 patients", "Stateavg": "al_scip-vte-2" } ], "ground_truth": [ { "row": 513, "column": "CountyName", "clean_value": "cherokee" }, { "row": 514, "column": "Score", "clean_value": "100%" } ], "predicted_repairs": [ { "row": 512, "column": "Index", "new_value": "513", "reason": "The address '400 northwood dr' has been replaced with '513'." }, { "row": 513, "column": "ProviderNumber", "new_value": "10022", "reason": "The address '400 northwood dr' has been replaced with '10022'." }, { "row": 514, "column": "Address1", "new_value": "400 northwood dr", "reason": "The address '400 northwood dr' has been replaced with '400 northwood dr'." }, { "row": 515, "column": "Address2", "new_value": "", "reason": "The address '400 northwood dr' has been replaced with an empty string." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 512,\n \"column\": \"Index\",\n \"new_value\": \"513\",\n \"reason\": \"The address '400 northwood dr' has been replaced with '513'.\"\n },\n {\n \"row\": 513,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10022\",\n \"reason\": \"The address '400 northwood dr' has been replaced with '10022'.\"\n },\n {\n \"row\": 514,\n \"column\": \"Address1\",\n \"new_value\": \"400 northwood dr\",\n \"reason\": \"The address '400 northwood dr' has been replaced with '400 northwood dr'.\"\n },\n {\n \"row\": 515,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The address '400 northwood dr' has been replaced with an empty string.\"\n }\n ]\n}\n```" }, { "task_index": 22, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 2, "schema_case_error": 4 }, "target_rows": [ { "_row": "870", "index": "871", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "80%", "Sample": "15 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "871", "index": "872", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "87%", "Sample": "15 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "872", "index": "873", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntaxy non-pxofit - pxivate", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "87%", "Sample": "15 patiexts", "Stateavg": "al_scip-inf-3" }, { "_row": "873", "index": "874", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 872, "column": "HospitalOwner", "clean_value": "voluntary non-profit - private" }, { "row": 872, "column": "Sample", "clean_value": "15 patients" } ], "predicted_repairs": [ { "row": 870, "column": "Index", "new_value": "870", "reason": "The address '1256 military street south' does not match any allowed column name." }, { "row": 871, "column": "Index", "new_value": "871", "reason": "The address '1256 military street south' does not match any allowed column name." }, { "row": 872, "column": "Index", "new_value": "872", "reason": "The address '1256 military street south' does not match any allowed column name." }, { "row": 873, "column": "Index", "new_value": "873", "reason": "The address '1256 military street south' does not match any allowed column name." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 870,\n \"column\": \"Index\",\n \"new_value\": \"870\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n },\n {\n \"row\": 871,\n \"column\": \"Index\",\n \"new_value\": \"871\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n },\n {\n \"row\": 872,\n \"column\": \"Index\",\n \"new_value\": \"872\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n },\n {\n \"row\": 873,\n \"column\": \"Index\",\n \"new_value\": \"873\",\n \"reason\": \"The address '1256 military street south' does not match any allowed column name.\"\n }\n ]\n}\n```" }, { "task_index": 23, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 4 }, "target_rows": [ { "_row": "324", "tuple_id": "325", "src": "weather", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:20 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "2:49 p.m." }, { "_row": "325", "tuple_id": "326", "src": "weather", "flight": "UA-854-SFO-IAH", "sched_dep_time": "7:53 a.m.", "act_dep_time": "8:07 a.m.", "sched_arr_time": "1:39 p.m.", "act_arr_time": "1:23 p.m." }, { "_row": "326", "tuple_id": "327", "src": "weather", "flight": "AA-415-BOS-ORD", "sched_dep_time": "8:35 a.m.", "act_dep_time": "", "sched_arr_time": "10:40 a.m.", "act_arr_time": "" }, { "_row": "327", "tuple_id": "328", "src": "weather", "flight": "AA-85-JFK-SFO", "sched_dep_time": "3:05 p.m.", "act_dep_time": "", "sched_arr_time": "6:30 p.m.", "act_arr_time": "" } ], "ground_truth": [ { "row": 324, "column": "act_dep_time", "clean_value": "1:19 p.m." }, { "row": 324, "column": "act_arr_time", "clean_value": "3:13 p.m." }, { "row": 325, "column": "act_dep_time", "clean_value": "7:49 a.m." }, { "row": 325, "column": "act_arr_time", "clean_value": "1:30 p.m." }, { "row": 326, "column": "act_dep_time", "clean_value": "8:56 a.m." }, { "row": 326, "column": "act_arr_time", "clean_value": "10:16 a.m." }, { "row": 327, "column": "act_dep_time", "clean_value": "3:36 p.m." }, { "row": 327, "column": "act_arr_time", "clean_value": "6:43 p.m." } ], "predicted_repairs": [ { "row": 324, "column": "act_arr_time", "new_value": "1:23 p.m.", "reason": "The act_arr_time for flight AA-854-SFO-IAH has been updated to 1:23 PM." }, { "row": 325, "column": "act_arr_time", "new_value": "", "reason": "The act_arr_time for flight AA-85-JFK-SFO is missing or incorrect." }, { "row": 326, "column": "act_arr_time", "new_value": "", "reason": "The act_arr_time for flight AA-415-BOS-ORD is missing or incorrect." }, { "row": 327, "column": "act_arr_time", "new_value": "", "reason": "The act_arr_time for flight AA-789-ORD-DEN is missing or incorrect." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 324,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:23 p.m.\",\n \"reason\": \"The act_arr_time for flight AA-854-SFO-IAH has been updated to 1:23 PM.\"\n },\n {\n \"row\": 325,\n \"column\": \"act_arr_time\",\n \"new_value\": \"\",\n \"reason\": \"The act_arr_time for flight AA-85-JFK-SFO is missing or incorrect.\"\n },\n {\n \"row\": 326,\n \"column\": \"act_arr_time\",\n \"new_value\": \"\",\n \"reason\": \"The act_arr_time for flight AA-415-BOS-ORD is missing or incorrect.\"\n },\n {\n \"row\": 327,\n \"column\": \"act_arr_time\",\n \"new_value\": \"\",\n \"reason\": \"The act_arr_time for flight AA-789-ORD-DEN is missing or incorrect.\"\n }\n ]\n}\n```" }, { "task_index": 26, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 2 }, "target_rows": [ { "_row": "471", "tuple_id": "472", "src": "flightview", "flight": "AA-4344-ORD-DTW", "sched_dep_time": "", "act_dep_time": "12:14 p.m.", "sched_arr_time": "", "act_arr_time": "2:01 p.m." }, { "_row": "472", "tuple_id": "473", "src": "flightview", "flight": "UA-257-JFK-SFO", "sched_dep_time": "2:30 p.m.", "act_dep_time": "2:43 p.m.", "sched_arr_time": "6:15 p.m.", "act_arr_time": "5:42 p.m." }, { "_row": "473", "tuple_id": "474", "src": "flightview", "flight": "UA-2945-PHL-CLT", "sched_dep_time": "12:00 p.m.", "act_dep_time": "12:08 p.m.", "sched_arr_time": "1:45 p.m.", "act_arr_time": "1:14 p.m." }, { "_row": "474", "tuple_id": "475", "src": "flightview", "flight": "CO-63-EWR-IAH", "sched_dep_time": "", "act_dep_time": "5:38 p.m.", "sched_arr_time": "", "act_arr_time": "8:03 p.m." } ], "ground_truth": [ { "row": 471, "column": "sched_dep_time", "clean_value": "11:45 a.m." }, { "row": 471, "column": "act_dep_time", "clean_value": "12:13 p.m." }, { "row": 471, "column": "sched_arr_time", "clean_value": "2:00 p.m." }, { "row": 471, "column": "act_arr_time", "clean_value": "2:10 p.m." }, { "row": 472, "column": "act_dep_time", "clean_value": "2:26 p.m." }, { "row": 473, "column": "sched_dep_time", "clean_value": "12:00 a.m." }, { "row": 473, "column": "act_dep_time", "clean_value": "3:11 a.m." }, { "row": 473, "column": "act_arr_time", "clean_value": "1:15 p.m." }, { "row": 474, "column": "sched_dep_time", "clean_value": "5:25 p.m." }, { "row": 474, "column": "act_dep_time", "clean_value": "5:22 p.m." }, { "row": 474, "column": "sched_arr_time", "clean_value": "8:22 p.m." } ], "predicted_repairs": [ { "row": 471, "column": "act_arr_time", "new_value": "5:42 p.m.", "reason": "The act_arr_time for flight UA-257-JFK-SFO has been updated to 5:42 PM." }, { "row": 472, "column": "act_arr_time", "new_value": "1:14 p.m.", "reason": "The act_arr_time for flight UA-2945-PHL-CLT has been updated to 1:14 PM." }, { "row": 473, "column": "act_arr_time", "new_value": "8:03 p.m.", "reason": "The act_arr_time for flight CO-63-EWR-IAH has been updated to 8:03 PM." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 471,\n \"column\": \"act_arr_time\",\n \"new_value\": \"5:42 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-257-JFK-SFO has been updated to 5:42 PM.\"\n },\n {\n \"row\": 472,\n \"column\": \"act_arr_time\",\n \"new_value\": \"1:14 p.m.\",\n \"reason\": \"The act_arr_time for flight UA-2945-PHL-CLT has been updated to 1:14 PM.\"\n },\n {\n \"row\": 473,\n \"column\": \"act_arr_time\",\n \"new_value\": \"8:03 p.m.\",\n \"reason\": \"The act_arr_time for flight CO-63-EWR-IAH has been updated to 8:03 PM.\"\n }\n ]\n}\n```" }, { "task_index": 27, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "379", "index": "380", "id": "397", "beer-name": "SummerBright Ale", "style": "American Pale Wheat Ale", "ounces": "12.0 ounce", "abv": "0.045", "ibu": "15", "brewery_id": "391", "brewery-name": "Breckenridge Brewery", "city": "Denver", "state": "CO" }, { "_row": "380", "index": "381", "id": "193", "beer-name": "Lucky U IPA", "style": "American IPA", "ounces": "12.0 ounce", "abv": "0.062%", "ibu": "68", "brewery_id": "391", "brewery-name": "Breckenridge Brewery", "city": "Denver", "state": "CO" }, { "_row": "381", "index": "382", "id": "83", "beer-name": "Avalanche Ale", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.054", "ibu": "19", "brewery_id": "391", "brewery-name": "Breckenridge Brewery", "city": "Denver CO", "state": "" }, { "_row": "382", "index": "383", "id": "1802", "beer-name": "You're My Boy, Blue", "style": "Fruit / Vegetable Beer", "ounces": "12.0 oz.", "abv": "0.05", "ibu": "N/A", "brewery_id": "308", "brewery-name": "Brew Bus Brewing", "city": "Tampa", "state": "FL" } ], "ground_truth": [ { "row": 379, "column": "ounces", "clean_value": "12" }, { "row": 380, "column": "ounces", "clean_value": "12" }, { "row": 380, "column": "abv", "clean_value": "0.062" }, { "row": 381, "column": "ounces", "clean_value": "12" }, { "row": 381, "column": "city", "clean_value": "Denver" }, { "row": 381, "column": "state", "clean_value": "CO" }, { "row": 382, "column": "ounces", "clean_value": "12" }, { "row": 382, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 379, "column": "abv", "new_value": "0.045", "reason": "The beer name has been replaced with 'SummerBright Ale'." }, { "row": 380, "column": "abv", "new_value": "0.062%", "reason": "The beer name has been replaced with 'Lucky U IPA'." }, { "row": 381, "column": "abv", "new_value": "0.054", "reason": "The beer name has been replaced with 'Avalanche Ale'." }, { "row": 382, "column": "abv", "new_value": "0.05", "reason": "The beer name has been replaced with 'You're My Boy, Blue'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 379,\n \"column\": \"abv\",\n \"new_value\": \"0.045\",\n \"reason\": \"The beer name has been replaced with 'SummerBright Ale'.\"\n },\n {\n \"row\": 380,\n \"column\": \"abv\",\n \"new_value\": \"0.062%\",\n \"reason\": \"The beer name has been replaced with 'Lucky U IPA'.\"\n },\n {\n \"row\": 381,\n \"column\": \"abv\",\n \"new_value\": \"0.054\",\n \"reason\": \"The beer name has been replaced with 'Avalanche Ale'.\"\n },\n {\n \"row\": 382,\n \"column\": \"abv\",\n \"new_value\": \"0.05\",\n \"reason\": \"The beer name has been replaced with 'You're My Boy, Blue'.\"\n }\n ]\n}\n```" }, { "task_index": 28, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "missed_repair": 1, "schema_case_error": 4 }, "target_rows": [ { "_row": "958", "index": "959", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprise", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-4", "MeasureName": "heart attack patients given smoking cessation advice/counseling", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-4" }, { "_row": "959", "index": "960", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprise", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "100%", "Sample": "2 patients", "Stateavg": "al_ami-5" }, { "_row": "960", "index": "961", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprxse", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "961", "index": "962", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprise", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" } ], "ground_truth": [ { "row": 960, "column": "City", "clean_value": "enterprise" } ], "predicted_repairs": [ { "row": 958, "column": "Index", "new_value": "Enterprise", "reason": "The address '400 n Edwards Street' is invalid as it does not have a specific location." }, { "row": 959, "column": "Index", "new_value": "Enterprise", "reason": "The address '400 n Edwards Street' is invalid as it does not have a specific location." }, { "row": 960, "column": "Index", "new_value": "Enterprise", "reason": "The address '400 n Edwards Street' is invalid as it does not have a specific location." }, { "row": 961, "column": "Index", "new_value": "Enterprise", "reason": "The address '400 n Edwards Street' is invalid as it does not have a specific location." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 958,\n \"column\": \"Index\",\n \"new_value\": \"Enterprise\",\n \"reason\": \"The address '400 n Edwards Street' is invalid as it does not have a specific location.\"\n },\n {\n \"row\": 959,\n \"column\": \"Index\",\n \"new_value\": \"Enterprise\",\n \"reason\": \"The address '400 n Edwards Street' is invalid as it does not have a specific location.\"\n },\n {\n \"row\": 960,\n \"column\": \"Index\",\n \"new_value\": \"Enterprise\",\n \"reason\": \"The address '400 n Edwards Street' is invalid as it does not have a specific location.\"\n },\n {\n \"row\": 961,\n \"column\": \"Index\",\n \"new_value\": \"Enterprise\",\n \"reason\": \"The address '400 n Edwards Street' is invalid as it does not have a specific location.\"\n }\n ]\n}\n```" }, { "task_index": 29, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_cell": 4 }, "target_rows": [ { "_row": "931", "tuple_id": "932", "src": "flightarrival", "flight": "AA-3-JFK-LAX", "sched_dep_time": "12:00 p.m.", "act_dep_time": "12:12 p.m.", "sched_arr_time": "3:15 p.m.", "act_arr_time": "3:10 p.m." }, { "_row": "932", "tuple_id": "933", "src": "flightarrival", "flight": "CO-1694-LAX-IAH", "sched_dep_time": "7:15 p.m.", "act_dep_time": "7:15 p.m. (Estimated)", "sched_arr_time": "12:21 a.m.", "act_arr_time": "12:21 a.m. (Estimated)" }, { "_row": "933", "tuple_id": "934", "src": "flightarrival", "flight": "CO-1193-EWR-MCO", "sched_dep_time": "9:15 a.m.", "act_dep_time": "", "sched_arr_time": "12:18 p.m.", "act_arr_time": "" }, { "_row": "934", "tuple_id": "935", "src": "flightarrival", "flight": "UA-2906-PHL-MCO", "sched_dep_time": "3:50 p.m.", "act_dep_time": "4:46 p.m.", "sched_arr_time": "6:23 p.m.", "act_arr_time": "6:36 p.m." } ], "ground_truth": [ { "row": 931, "column": "act_dep_time", "clean_value": "12:11 p.m." }, { "row": 931, "column": "act_arr_time", "clean_value": "3:16 p.m." }, { "row": 932, "column": "act_dep_time", "clean_value": "7:15 p.m." }, { "row": 932, "column": "act_arr_time", "clean_value": "12:21 a.m." }, { "row": 933, "column": "act_dep_time", "clean_value": "9:14 a.m." }, { "row": 933, "column": "act_arr_time", "clean_value": "12:09 p.m." }, { "row": 934, "column": "act_dep_time", "clean_value": "4:28 p.m." }, { "row": 934, "column": "act_arr_time", "clean_value": "6:38 p.m." } ], "predicted_repairs": [ { "row": 931, "column": "Column", "new_value": "value", "reason": "Why" }, { "row": 932, "column": "Column", "new_value": "value", "reason": "Why" }, { "row": 933, "column": "Column", "new_value": "value", "reason": "Why" }, { "row": 934, "column": "Column", "new_value": "value", "reason": "Why" } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 931,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n },\n {\n \"row\": 932,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n },\n {\n \"row\": 933,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n },\n {\n \"row\": 934,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"Why\"\n }\n ]\n}\n```" }, { "task_index": 31, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "521", "index": "522", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yxs", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "522", "index": "523", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "96%", "Sample": "27 patients", "Stateavg": "al_ami-8a" }, { "_row": "523", "index": "524", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "100%", "Sample": "25x patients", "Stateavg": "al_hf-1" }, { "_row": "524", "index": "525", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "100%", "Sample": "292 patients", "Stateavg": "al_hf-2" } ], "ground_truth": [ { "row": 521, "column": "EmergencyService", "clean_value": "yes" }, { "row": 523, "column": "Sample", "clean_value": "257 patients" } ], "predicted_repairs": [ { "row": 521, "column": "Index", "new_value": "522", "reason": "The index has been updated to '522'." }, { "row": 522, "column": "ProviderNumber", "new_value": "10023", "reason": "The ProviderNumber has been updated to '10023'." }, { "row": 523, "column": "Address1", "new_value": "2105 east south boulevard", "reason": "The Address1 has been updated to '2105 east south boulevard'." }, { "row": 524, "column": "Address2", "new_value": "", "reason": "The Address2 has been removed as it is empty." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 521,\n \"column\": \"Index\",\n \"new_value\": \"522\",\n \"reason\": \"The index has been updated to '522'.\"\n },\n {\n \"row\": 522,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10023\",\n \"reason\": \"The ProviderNumber has been updated to '10023'.\"\n },\n {\n \"row\": 523,\n \"column\": \"Address1\",\n \"new_value\": \"2105 east south boulevard\",\n \"reason\": \"The Address1 has been updated to '2105 east south boulevard'.\"\n },\n {\n \"row\": 524,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The Address2 has been removed as it is empty.\"\n }\n ]\n}\n```" }, { "task_index": 32, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "wrong_cell": 4 }, "target_rows": [ { "_row": "655", "tuple_id": "656", "src": "panynj", "flight": "AA-466-IAH-MIA", "sched_dep_time": "6:00 a.m.", "act_dep_time": "6:09 a.m.", "sched_arr_time": "9:20 a.m.", "act_arr_time": "9:05 a.m." }, { "_row": "656", "tuple_id": "657", "src": "panynj", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:45 a.m.", "sched_arr_time": "4:57 p.m.", "act_arr_time": "5:03 p.m." }, { "_row": "657", "tuple_id": "658", "src": "panynj", "flight": "CO-89-IAH-EWR", "sched_dep_time": "", "act_dep_time": "6:17 a.m.", "sched_arr_time": "", "act_arr_time": "10:27 a.m." }, { "_row": "658", "tuple_id": "659", "src": "panynj", "flight": "CO-1088-CLE-IAH", "sched_dep_time": "", "act_dep_time": "9:01 a.m.", "sched_arr_time": "", "act_arr_time": "10:56 a.m." } ], "ground_truth": [ { "row": 655, "column": "act_dep_time", "clean_value": "6:08 a.m." }, { "row": 656, "column": "act_dep_time", "clean_value": "11:30 a.m." }, { "row": 656, "column": "act_arr_time", "clean_value": "5:05 p.m." }, { "row": 657, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 657, "column": "act_dep_time", "clean_value": "6:02 a.m." }, { "row": 657, "column": "sched_arr_time", "clean_value": "10:20 a.m." }, { "row": 658, "column": "sched_dep_time", "clean_value": "8:40 a.m." }, { "row": 658, "column": "act_dep_time", "clean_value": "8:40 a.m." }, { "row": 658, "column": "sched_arr_time", "clean_value": "10:54 a.m." } ], "predicted_repairs": [ { "row": 655, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 656, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 657, "column": "Column", "new_value": "value", "reason": "why" }, { "row": 658, "column": "Column", "new_value": "value", "reason": "why" } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 655,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 656,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 657,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n },\n {\n \"row\": 658,\n \"column\": \"Column\",\n \"new_value\": \"value\",\n \"reason\": \"why\"\n }\n ]\n}\n```" }, { "task_index": 33, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 13, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 13, "overrepair": 4 }, "target_rows": [ { "_row": "541", "index": "542", "id": "61", "beer-name": "Supper Club Lager", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "", "ibu": "N/A", "brewery_id": "192", "brewery-name": "Capital Brewery", "city": "Middleton", "state": "WI" }, { "_row": "542", "index": "543", "id": "784", "beer-name": "Carolina Lighthouse (2007)", "style": "American Blonde Ale", "ounces": "12.0 ounce", "abv": "0.04", "ibu": "N/A", "brewery_id": "504", "brewery-name": "Carolina Beer & Beverage", "city": "Mooresville NC", "state": "" }, { "_row": "543", "index": "544", "id": "783", "beer-name": "Carolina Blonde (2006)", "style": "American Blonde Ale", "ounces": "12.0 ounce", "abv": "0.05%", "ibu": "N/A", "brewery_id": "504", "brewery-name": "Carolina Beer & Beverage", "city": "Mooresville NC", "state": "" }, { "_row": "544", "index": "545", "id": "782", "beer-name": "Carolina Blonde Light (2005)", "style": "American Blonde Ale", "ounces": "12.0 oz", "abv": "0.035", "ibu": "N/A", "brewery_id": "504", "brewery-name": "Carolina Beer & Beverage", "city": "Mooresville", "state": "NC" } ], "ground_truth": [ { "row": 541, "column": "ounces", "clean_value": "12" }, { "row": 541, "column": "ibu", "clean_value": "" }, { "row": 542, "column": "ounces", "clean_value": "12" }, { "row": 542, "column": "ibu", "clean_value": "" }, { "row": 542, "column": "city", "clean_value": "Mooresville" }, { "row": 542, "column": "state", "clean_value": "NC" }, { "row": 543, "column": "ounces", "clean_value": "12" }, { "row": 543, "column": "abv", "clean_value": "0.05" }, { "row": 543, "column": "ibu", "clean_value": "" }, { "row": 543, "column": "city", "clean_value": "Mooresville" }, { "row": 543, "column": "state", "clean_value": "NC" }, { "row": 544, "column": "ounces", "clean_value": "12" }, { "row": 544, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 541, "column": "style", "new_value": "American Pale Lager", "reason": "The beer name has been changed to American Pale Lager." }, { "row": 542, "column": "style", "new_value": "American Blonde Ale", "reason": "The beer name has been changed to American Blonde Ale." }, { "row": 543, "column": "style", "new_value": "American Blonde Ale", "reason": "The beer name has been changed to American Blonde Ale." }, { "row": 544, "column": "style", "new_value": "American Blonde Ale", "reason": "The beer name has been changed to American Blonde Ale." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 541,\n \"column\": \"style\",\n \"new_value\": \"American Pale Lager\",\n \"reason\": \"The beer name has been changed to American Pale Lager.\"\n },\n {\n \"row\": 542,\n \"column\": \"style\",\n \"new_value\": \"American Blonde Ale\",\n \"reason\": \"The beer name has been changed to American Blonde Ale.\"\n },\n {\n \"row\": 543,\n \"column\": \"style\",\n \"new_value\": \"American Blonde Ale\",\n \"reason\": \"The beer name has been changed to American Blonde Ale.\"\n },\n {\n \"row\": 544,\n \"column\": \"style\",\n \"new_value\": \"American Blonde Ale\",\n \"reason\": \"The beer name has been changed to American Blonde Ale.\"\n }\n ]\n}\n```" }, { "task_index": 34, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 1, "overrepair": 3, "schema_case_error": 1 }, "target_rows": [ { "_row": "460", "index": "461", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "91%", "Sample": "255 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "461", "index": "462", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "84%", "Sample": "245 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "462", "index": "463", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "x patients", "Stateavg": "al_scip-inf-4" }, { "_row": "463", "index": "464", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "97%", "Sample": "369 patients", "Stateavg": "al_scip-inf-6" } ], "ground_truth": [ { "row": 462, "column": "Sample", "clean_value": "0 patients" } ], "predicted_repairs": [ { "row": 460, "column": "Index", "new_value": "461", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." }, { "row": 461, "column": "ProviderNumber", "new_value": "10019", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." }, { "row": 462, "column": "Address1", "new_value": "1300 south Montgomery avenue", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." }, { "row": 463, "column": "Address2", "new_value": "", "reason": "The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 460,\n \"column\": \"Index\",\n \"new_value\": \"461\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n },\n {\n \"row\": 461,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10019\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n },\n {\n \"row\": 462,\n \"column\": \"Address1\",\n \"new_value\": \"1300 south Montgomery avenue\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n },\n {\n \"row\": 463,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The address '1300 south Montgomery Avenue' was found in the target rows but does not match any of the allowed column names.\"\n }\n ]\n}\n```" }, { "task_index": 37, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.087, "precision": 0.05, "recall": 0.3333, "tp": 1, "fp": 19, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 2, "overrepair": 18, "schema_case_error": 1 }, "target_rows": [ { "_row": "502", "index": "503", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "chxrokxx", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-2", "MeasureName": "pneumonia patients assessed and given pneumococcal vaccination", "Score": "93%", "Sample": "44 paxienxs", "Stateavg": "al_pn-2" }, { "_row": "503", "index": "504", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-3b", "MeasureName": "pneumonia patients whose initial emergency room blood culture was performed prior to the administration of the first hospital dose of antibiotics", "Score": "97%", "Sample": "33 patients", "Stateavg": "al_pn-3b" }, { "_row": "504", "index": "505", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "ax", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-4", "MeasureName": "pneumonia patients given smoking cessation advice/counseling", "Score": "100%", "Sample": "20 patients", "Stateavg": "al_pn-4" }, { "_row": "505", "index": "506", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-5c", "MeasureName": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "Score": "89%", "Sample": "56 patients", "Stateavg": "al_pn-5c" } ], "ground_truth": [ { "row": 502, "column": "CountyName", "clean_value": "cherokee" }, { "row": 502, "column": "Sample", "clean_value": "44 patients" }, { "row": 504, "column": "State", "clean_value": "al" } ], "predicted_repairs": [ { "row": 502, "column": "Index", "new_value": "503", "reason": "The new value for index is incorrect." }, { "row": 503, "column": "ProviderNumber", "new_value": "10022", "reason": "The new value for ProviderNumber is incorrect." }, { "row": 504, "column": "Address1", "new_value": "400 northwood dr", "reason": "The new value for Address1 is incorrect." }, { "row": 504, "column": "Address2", "new_value": "", "reason": "The new value for Address2 is missing or incorrect." }, { "row": 504, "column": "Address3", "new_value": "", "reason": "The new value for Address3 is missing or incorrect." }, { "row": 504, "column": "City", "new_value": "centre", "reason": "The new value for City is incorrect." }, { "row": 504, "column": "CountyName", "new_value": "cherokee", "reason": "The new value for CountyName is incorrect." }, { "row": 504, "column": "EmergencyService", "new_value": "yes", "reason": "The new value for EmergencyService is incorrect." }, { "row": 504, "column": "HospitalName", "new_value": "cherokee medical center", "reason": "The new value for HospitalName is incorrect." }, { "row": 504, "column": "HospitalOwner", "new_value": "voluntary non-profit - private", "reason": "The new value for HospitalOwner is incorrect." }, { "row": 504, "column": "HospitalType", "new_value": "acute care hospitals", "reason": "The new value for HospitalType is incorrect." }, { "row": 504, "column": "MeasureCode", "new_value": "pn-4", "reason": "The new value for MeasureCode is incorrect." }, { "row": 504, "column": "MeasureName", "new_value": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "reason": "The new value for MeasureName is incorrect." }, { "row": 504, "column": "PhoneNumber", "new_value": "2569275531", "reason": "The new value for PhoneNumber is incorrect." }, { "row": 504, "column": "ProviderNumber", "new_value": "10022", "reason": "The new value for ProviderNumber is incorrect." }, { "row": 504, "column": "Sample", "new_value": "20 patients", "reason": "The new value for Sample is incorrect." }, { "row": 504, "column": "Score", "new_value": "100%", "reason": "The new value for Score is incorrect." }, { "row": 504, "column": "State", "new_value": "al", "reason": "The new value for State is incorrect." }, { "row": 504, "column": "Stateavg", "new_value": "al_pn-4", "reason": "The new value for Stateavg is incorrect." }, { "row": 504, "column": "ZipCode", "new_value": "35960", "reason": "The new value for ZipCode is incorrect." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 502,\n \"column\": \"Index\",\n \"new_value\": \"503\",\n \"reason\": \"The new value for index is incorrect.\"\n },\n {\n \"row\": 503,\n \"column\": \"ProviderNumber\",\n \"new_value\": \"10022\",\n \"reason\": \"The new value for ProviderNumber is incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"Address1\",\n \"new_value\": \"400 northwood dr\",\n \"reason\": \"The new value for Address1 is incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"Address2\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address2 is missing or incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"Address3\",\n \"new_value\": \"\",\n \"reason\": \"The new value for Address3 is missing or incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"City\",\n \"new_value\": \"centre\",\n \"reason\": \"The new value for City is incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"CountyName\",\n \"new_value\": \"cherokee\",\n \"reason\": \"The new value for CountyName is incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"EmergencyService\",\n \"new_value\": \"yes\",\n \"reason\": \"The new value for EmergencyService is incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"HospitalName\",\n \"new_value\": \"cherokee medical center\",\n \"reason\": \"The new value for HospitalName is incorrect.\"\n },\n {\n \"row\": 504,\n \"column\": \"HospitalOwner\",\n \"" }, { "task_index": 38, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 1, "failure_taxonomy": { "missed_repair": 8, "schema_case_error": 1, "wrong_cell": 3 }, "target_rows": [ { "_row": "1394", "tuple_id": "1395", "src": "orbitz", "flight": "UA-858-PVG-SFO", "sched_dep_time": "1:45 p.m.", "act_dep_time": "1:32 p.m.", "sched_arr_time": "8:27aDec 1", "act_arr_time": "8:02aDec 1" }, { "_row": "1395", "tuple_id": "1396", "src": "orbitz", "flight": "UA-2704-DTW-PHX", "sched_dep_time": "11:15aDec 1", "act_dep_time": "11:15aDec 1", "sched_arr_time": "1:40 p.m.", "act_arr_time": "2:00 p.m." }, { "_row": "1396", "tuple_id": "1397", "src": "orbitz", "flight": "AA-3063-SLC-LAX", "sched_dep_time": "8:20 p.m.", "act_dep_time": "8:30 p.m.", "sched_arr_time": "9:18 p.m.", "act_arr_time": "" }, { "_row": "1397", "tuple_id": "1398", "src": "orbitz", "flight": "UA-2708-EWR-CLT", "sched_dep_time": "2:55 p.m.", "act_dep_time": "2:52 p.m.", "sched_arr_time": "4:53 p.m.", "act_arr_time": "4:44 p.m." } ], "ground_truth": [ { "row": 1394, "column": "sched_arr_time", "clean_value": "8:27 a.m." }, { "row": 1394, "column": "act_arr_time", "clean_value": "8:02 a.m." }, { "row": 1395, "column": "sched_dep_time", "clean_value": "11:15 a.m." }, { "row": 1395, "column": "act_dep_time", "clean_value": "11:15 a.m." }, { "row": 1396, "column": "act_dep_time", "clean_value": "8:39 p.m." }, { "row": 1396, "column": "sched_arr_time", "clean_value": "9:20 p.m." }, { "row": 1396, "column": "act_arr_time", "clean_value": "9:20 p.m." }, { "row": 1397, "column": "act_dep_time", "clean_value": "2:55 p.m." } ], "predicted_repairs": [ { "row": 1394, "column": "Tuple ID", "new_value": "1395", "reason": "The 'Tuple ID' column has been updated to '1395'." }, { "row": 1395, "column": "Flight", "new_value": "UA-2704-DTW-PHX", "reason": "The 'Flight' column has been updated to 'UA-2704-DTW-PHX'." }, { "row": 1396, "column": "Schedule Arr Time", "new_value": "", "reason": "The 'Schedule Arr Time' column is empty." }, { "row": 1397, "column": "Act Dep Time", "new_value": "8:30 p.m.", "reason": "The 'Act Dep Time' column has been updated to '8:30 p.m.'." } ], "decoded_preview": "```json\n{\n \"action\": \"submit_repairs\",\n \"repairs\": [\n {\n \"row\": 1394,\n \"column\": \"Tuple ID\",\n \"new_value\": \"1395\",\n \"reason\": \"The 'Tuple ID' column has been updated to '1395'.\"\n },\n {\n \"row\": 1395,\n \"column\": \"Flight\",\n \"new_value\": \"UA-2704-DTW-PHX\",\n \"reason\": \"The 'Flight' column has been updated to 'UA-2704-DTW-PHX'.\"\n },\n {\n \"row\": 1396,\n \"column\": \"Schedule Arr Time\",\n \"new_value\": \"\",\n \"reason\": \"The 'Schedule Arr Time' column is empty.\"\n },\n {\n \"row\": 1397,\n \"column\": \"Act Dep Time\",\n \"new_value\": \"8:30 p.m.\",\n \"reason\": \"The 'Act Dep Time' column has been updated to '8:30 p.m.'.\"\n }\n ]\n}\n```" } ] } }, "sft": { "model_label": "sft", "task_scores": [ { "task_index": 1, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4 } }, { "task_index": 2, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 } }, { "task_index": 3, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 4, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 4 } }, { "task_index": 5, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 6, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 7, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 8, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 9, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 } }, { "task_index": 10, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 11, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 14, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "wrong_value": 4 } }, { "task_index": 12, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 4 } }, { "task_index": 13, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 } }, { "task_index": 14, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 4 } }, { "task_index": 15, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 16, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 } }, { "task_index": 17, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 3, "wrong_cell": 1 } }, { "task_index": 18, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 1 } }, { "task_index": 19, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 } }, { "task_index": 20, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 21, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 22, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 } }, { "task_index": 23, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 4 } }, { "task_index": 24, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 25, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 26, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 27, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 28, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4 } }, { "task_index": 29, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.1667, "precision": 0.25, "recall": 0.125, "tp": 1, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 3 } }, { "task_index": 30, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 31, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 } }, { "task_index": 32, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 33, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 13, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "overrepair": 2, "wrong_value": 1 } }, { "task_index": 34, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4 } }, { "task_index": 35, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 36, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 } }, { "task_index": 37, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 3, "parse_ok": false, "parse_error_kind": "truncated_json", "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3 } }, { "task_index": 38, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 39, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 40, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 41, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 42, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9 } }, { "task_index": 43, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 4 } }, { "task_index": 44, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 45, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 46, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 } }, { "task_index": 47, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.25, "precision": 0.25, "recall": 0.25, "tp": 1, "fp": 3, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 3 } }, { "task_index": 48, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 49, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 5, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4, "wrong_cell": 1 } }, { "task_index": 50, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 51, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.1538, "precision": 0.3333, "recall": 0.1, "tp": 1, "fp": 2, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 2 } }, { "task_index": 52, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 5, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 5, "failure_taxonomy": { "missed_repair": 2, "schema_case_error": 5 } }, { "task_index": 53, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 54, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 55, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 56, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 } }, { "task_index": 57, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 } }, { "task_index": 58, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 } }, { "task_index": 59, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 4 } }, { "task_index": 60, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5 } }, { "task_index": 61, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 4 } }, { "task_index": 62, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 15, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 15, "overrepair": 4 } }, { "task_index": 63, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5 } }, { "task_index": 64, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4 } }, { "task_index": 65, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 66, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.2, "precision": 0.25, "recall": 0.1667, "tp": 1, "fp": 3, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 2, "wrong_value": 1 } }, { "task_index": 67, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 3, "failure_taxonomy": { "missed_repair": 1, "schema_case_error": 3 } }, { "task_index": 68, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 2, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 16, "overrepair": 2 } }, { "task_index": 69, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 70, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "schema_case_error": 4 } }, { "task_index": 71, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 } }, { "task_index": 72, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 73, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 } }, { "task_index": 74, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 75, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 76, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4 } }, { "task_index": 77, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 4 } }, { "task_index": 78, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 } }, { "task_index": 79, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 5, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4, "wrong_cell": 1 } }, { "task_index": 80, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 1 } }, { "task_index": 81, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 } }, { "task_index": 82, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 } }, { "task_index": 83, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 15, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 84, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6 } }, { "task_index": 85, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "schema_case_error": 4 } }, { "task_index": 86, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 } }, { "task_index": 87, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 88, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 } }, { "task_index": 89, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 90, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 4 } }, { "task_index": 91, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 4 } }, { "task_index": 92, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "wrong_value": 4 } }, { "task_index": 93, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 } }, { "task_index": 94, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 1 } }, { "task_index": 95, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } }, { "task_index": 96, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 2, "wrong_value": 2 } }, { "task_index": 97, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.2857, "precision": 0.25, "recall": 0.3333, "tp": 1, "fp": 3, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3 } }, { "task_index": 98, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 4 } }, { "task_index": 99, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 3, "wrong_value": 1 } }, { "task_index": 100, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 } } ], "failure_samples": [ { "task_index": 1, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4 }, "target_rows": [ { "_row": "55", "index": "56", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-2", "MeasureName": "pneumonia patients assessed and given pneumococcal vaccination", "Score": "97%", "Sample": "172 patients", "Stateavg": "al_pn-2" }, { "_row": "56", "index": "57", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boxz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-3b", "MeasureName": "pneumonia patients whose initial emergency room blood culture was performed prior to the administration of the first hospital dose of antibiotics", "Score": "97%", "Sample": "120 patients", "Stateavg": "al_pn-xb" }, { "_row": "57", "index": "58", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505xuxsxhighwayx431xnorth", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2x6x938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-4", "MeasureName": "pneumonia patients given smoking cessation advice/counseling", "Score": "97%", "Sample": "98 patients", "Stateavg": "al_pn-4" }, { "_row": "58", "index": "59", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-5c", "MeasureName": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "Score": "96%", "Sample": "211 patients", "Stateavg": "al_pn-5c" } ], "ground_truth": [ { "row": 56, "column": "City", "clean_value": "boaz" }, { "row": 56, "column": "Stateavg", "clean_value": "al_pn-3b" }, { "row": 57, "column": "Address1", "clean_value": "2505 u s highway 431 north" }, { "row": 57, "column": "PhoneNumber", "clean_value": "2565938310" } ], "predicted_repairs": [], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":55,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'\"},{\"row\":56,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'\"},{\"row\":57,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'\"},{\"row\":58,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'}]}" }, { "task_index": 2, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 }, "target_rows": [ { "_row": "792", "tuple_id": "793", "src": "mia", "flight": "AA-2050-ORD-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "2:45P 12-01-11", "act_arr_time": "2:46P" }, { "_row": "793", "tuple_id": "794", "src": "mia", "flight": "AA-1165-JFK-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "10:34A 12-01-11", "act_arr_time": "10:08A" }, { "_row": "794", "tuple_id": "795", "src": "mia", "flight": "AA-484-DFW-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "7:55P 12-01-11", "act_arr_time": "7:39P" }, { "_row": "795", "tuple_id": "796", "src": "mia", "flight": "AA-466-IAH-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "9:20A 12-01-11", "act_arr_time": "9:04A" } ], "ground_truth": [ { "row": 792, "column": "sched_dep_time", "clean_value": "10:40 a.m." }, { "row": 792, "column": "act_dep_time", "clean_value": "11:05 a.m." }, { "row": 792, "column": "sched_arr_time", "clean_value": "2:45 p.m." }, { "row": 792, "column": "act_arr_time", "clean_value": "2:46 p.m." }, { "row": 793, "column": "sched_dep_time", "clean_value": "6:59 a.m." }, { "row": 793, "column": "act_dep_time", "clean_value": "7:22 a.m." }, { "row": 793, "column": "sched_arr_time", "clean_value": "10:34 a.m." }, { "row": 793, "column": "act_arr_time", "clean_value": "10:04 a.m." }, { "row": 794, "column": "sched_dep_time", "clean_value": "4:15 p.m." }, { "row": 794, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 794, "column": "sched_arr_time", "clean_value": "7:55 p.m." }, { "row": 794, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 795, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 795, "column": "act_dep_time", "clean_value": "6:08 a.m." }, { "row": 795, "column": "sched_arr_time", "clean_value": "9:20 a.m." }, { "row": 795, "column": "act_arr_time", "clean_value": "9:05 a.m." } ], "predicted_repairs": [ { "row": 792, "column": "act_arr_time", "new_value": "2:46P", "reason": "The new value for act_arr_time is incorrect." }, { "row": 793, "column": "act_arr_time", "new_value": "10:08A", "reason": "The new value for act_arr_time is incorrect." }, { "row": 794, "column": "act_arr_time", "new_value": "7:39P", "reason": "The new value for act_arr_time is incorrect." }, { "row": 795, "column": "act_arr_time", "new_value": "9:04A", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":792,\"column\":\"act_arr_time\",\"new_value\":\"2:46P\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":793,\"column\":\"act_arr_time\",\"new_value\":\"10:08A\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":794,\"column\":\"act_arr_time\",\"new_value\":\"7:39P\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":795,\"column\":\"act_arr_time\",\"new_value\":\"9:04A\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 3, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "1363", "index": "1364", "id": "2358", "beer-name": "Minhas Light (2012)", "style": "Light Lager", "ounces": "12.0 oz.", "abv": "0.04", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1364", "index": "1365", "id": "2282", "beer-name": "Huber", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "0.05%", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1365", "index": "1366", "id": "2281", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "16.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1366", "index": "1367", "id": "2280", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "12.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" } ], "ground_truth": [ { "row": 1363, "column": "ounces", "clean_value": "12" }, { "row": 1363, "column": "ibu", "clean_value": "" }, { "row": 1364, "column": "ounces", "clean_value": "12" }, { "row": 1364, "column": "abv", "clean_value": "0.05" }, { "row": 1364, "column": "ibu", "clean_value": "" }, { "row": 1365, "column": "ounces", "clean_value": "16" }, { "row": 1365, "column": "ibu", "clean_value": "" }, { "row": 1366, "column": "ounces", "clean_value": "12" }, { "row": 1366, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1363, "column": "abv", "new_value": "0.04", "reason": "The new value for abv is 0.04 instead of the expected 0.05." }, { "row": 1364, "column": "abv", "new_value": "0.05%", "reason": "The new value for abv is 0.05% instead of the expected 0.04." }, { "row": 1365, "column": "abv", "new_value": "0.062", "reason": "The new value for abv is 0.062 instead of the expected 0.05." }, { "row": 1366, "column": "abv", "new_value": "0.062", "reason": "The new value for abv is 0.062 instead of the expected 0.05." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1363,\"column\":\"abv\",\"new_value\":\"0.04\",\"reason\":\"The new value for abv is 0.04 instead of the expected 0.05.\"},{\"row\":1364,\"column\":\"abv\",\"new_value\":\"0.05%\",\"reason\":\"The new value for abv is 0.05% instead of the expected 0.04.\"},{\"row\":1365,\"column\":\"abv\",\"new_value\":\"0.062\",\"reason\":\"The new value for abv is 0.062 instead of the expected 0.05.\"},{\"row\":1366,\"column\":\"abv\",\"new_value\":\"0.062\",\"reason\":\"The new value for abv is 0.062 instead of the expected 0.05.\"}]}" }, { "task_index": 4, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 4 }, "target_rows": [ { "_row": "711", "index": "712", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "1xx%", "Sample": "9 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "712", "index": "713", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection xrevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "713", "index": "714", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "33x28365x1", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery paxienxs needing hair removed from xhe surgical area before surgery who had hair removed using a safer mexhod (elecxric clippers or hair removal cream c nox a razor)", "Score": "100%", "Sample": "33 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "714", "index": "715", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "88%", "Sample": "24 patients", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [ { "row": 711, "column": "Score", "clean_value": "100%" }, { "row": 712, "column": "Condition", "clean_value": "surgical infection prevention" }, { "row": 713, "column": "PhoneNumber", "clean_value": "3342836541" }, { "row": 713, "column": "MeasureName", "clean_value": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)" } ], "predicted_repairs": [ { "row": 711, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 712, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 713, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 714, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":711,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"},{\"row\":712,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"},{\"row\":713,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"},{\"row\":714,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"}]}" }, { "task_index": 5, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1727", "tuple_id": "1728", "src": "ua", "flight": "UA-397-JFK-SFO", "sched_dep_time": "8:00 a.m.", "act_dep_time": "8:29 a.m.", "sched_arr_time": "11:55 a.m.", "act_arr_time": "11:58 a.m." }, { "_row": "1728", "tuple_id": "1729", "src": "ua", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1729", "tuple_id": "1730", "src": "ua", "flight": "UA-2830-MCO-CLT", "sched_dep_time": "3:27 p.m.", "act_dep_time": "3:27 p.m.", "sched_arr_time": "5:05 p.m.", "act_arr_time": "5:17 p.m." }, { "_row": "1730", "tuple_id": "1731", "src": "ua", "flight": "UA-5487-SFO-MRY", "sched_dep_time": "10:39 a.m.", "act_dep_time": "10:33 a.m.", "sched_arr_time": "11:19 a.m.", "act_arr_time": "11:21 a.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1727, "column": "act_arr_time", "new_value": "11:58 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1728, "column": "act_arr_time", "new_value": "9:43 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1729, "column": "act_arr_time", "new_value": "5:17 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1730, "column": "act_arr_time", "new_value": "11:21 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1727,\"column\":\"act_arr_time\",\"new_value\":\"11:58 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1728,\"column\":\"act_arr_time\",\"new_value\":\"9:43 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1729,\"column\":\"act_arr_time\",\"new_value\":\"5:17 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1730,\"column\":\"act_arr_time\",\"new_value\":\"11:21 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 6, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "1840", "index": "1841", "id": "1539", "beer-name": "Monkey Fist IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.069%", "ibu": "65", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1841", "index": "1842", "id": "975", "beer-name": "Shipyard Summer Ale", "style": "American Pale Wheat Ale", "ounces": "12.0 oz", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1842", "index": "1843", "id": "814", "beer-name": "Pumpkinhead Ale", "style": "Pumpkin Ale", "ounces": "12.0 oz.", "abv": "0.047", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1843", "index": "1844", "id": "727", "beer-name": "Shipyard Export", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" } ], "ground_truth": [ { "row": 1840, "column": "ounces", "clean_value": "12" }, { "row": 1840, "column": "abv", "clean_value": "0.069" }, { "row": 1841, "column": "ounces", "clean_value": "12" }, { "row": 1841, "column": "ibu", "clean_value": "" }, { "row": 1842, "column": "ounces", "clean_value": "12" }, { "row": 1842, "column": "ibu", "clean_value": "" }, { "row": 1843, "column": "ounces", "clean_value": "12" }, { "row": 1843, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1840, "column": "abv", "new_value": "0.069%", "reason": "The new value for abv is incorrect." }, { "row": 1841, "column": "ibu", "new_value": "65", "reason": "The new value for ibu is incorrect." }, { "row": 1842, "column": "style", "new_value": "American IPA", "reason": "The new value for style is incorrect." }, { "row": 1843, "column": "ibu", "new_value": "N/A", "reason": "The new value for ibu is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1840,\"column\":\"abv\",\"new_value\":\"0.069%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1841,\"column\":\"ibu\",\"new_value\":\"65\",\"reason\":\"The new value for ibu is incorrect.\"},{\"row\":1842,\"column\":\"style\",\"new_value\":\"American IPA\",\"reason\":\"The new value for style is incorrect.\"},{\"row\":1843,\"column\":\"ibu\",\"new_value\":\"N/A\",\"reason\":\"The new value for ibu is incorrect.\"}]}" }, { "task_index": 7, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "483", "index": "484", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "xl", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-card-2", "MeasureName": "surgery patients who were taking heart drugs called beta blockers before coming to the hospital who were kept on the beta blockers during the period just before and after their surgery", "Score": "100%", "Sample": "12 patients", "Stateavg": "al_scip-card-2" }, { "_row": "484", "index": "485", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "1x6 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "94%", "Sample": "52 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "485", "index": "486", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "xzark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "96%", "Sample": "52 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "486", "index": "487", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "85%", "Sample": "48 patients", "Stateavg": "al_scip-inf-3" } ], "ground_truth": [ { "row": 483, "column": "State", "clean_value": "al" }, { "row": 484, "column": "Address1", "clean_value": "126 hospital ave" }, { "row": 485, "column": "City", "clean_value": "ozark" } ], "predicted_repairs": [ { "row": 483, "column": "Address1", "new_value": "126 hospital ave", "reason": "The address is incorrect." }, { "row": 484, "column": "Address1", "new_value": "1x6 hospital ave", "reason": "The address is incorrect." }, { "row": 485, "column": "Address1", "new_value": "126 hospital ave", "reason": "The address is incorrect." }, { "row": 486, "column": "Address1", "new_value": "126 hospital ave", "reason": "The address is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":483,\"column\":\"Address1\",\"new_value\":\"126 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"},{\"row\":484,\"column\":\"Address1\",\"new_value\":\"1x6 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"},{\"row\":485,\"column\":\"Address1\",\"new_value\":\"126 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"},{\"row\":486,\"column\":\"Address1\",\"new_value\":\"126 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"}]}" }, { "task_index": 8, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "2025", "tuple_id": "2026", "src": "allegiantair", "flight": "UA-2708-EWR-CLT", "sched_dep_time": "", "act_dep_time": "3:04 p.m.", "sched_arr_time": "", "act_arr_time": "4:24 p.m." }, { "_row": "2026", "tuple_id": "2027", "src": "allegiantair", "flight": "UA-62-IAH-EWR", "sched_dep_time": "", "act_dep_time": "2:59 p.m.", "sched_arr_time": "", "act_arr_time": "7:10 p.m." }, { "_row": "2027", "tuple_id": "2028", "src": "allegiantair", "flight": "UA-1500-IAH-GUA", "sched_dep_time": "", "act_dep_time": "9:43 a.m.", "sched_arr_time": "", "act_arr_time": "12:12 p.m." }, { "_row": "2028", "tuple_id": "2029", "src": "allegiantair", "flight": "AA-3804-PHL-ORD", "sched_dep_time": "2:35 p.m.", "act_dep_time": "2:44 p.m.", "sched_arr_time": "4:05 p.m.", "act_arr_time": "3:36 p.m." } ], "ground_truth": [ { "row": 2025, "column": "sched_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "act_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "sched_arr_time", "clean_value": "4:53 p.m." }, { "row": 2025, "column": "act_arr_time", "clean_value": "4:44 p.m." }, { "row": 2026, "column": "sched_dep_time", "clean_value": "2:30 p.m." }, { "row": 2026, "column": "act_dep_time", "clean_value": "2:48 p.m." }, { "row": 2026, "column": "sched_arr_time", "clean_value": "7:03 p.m." }, { "row": 2027, "column": "sched_dep_time", "clean_value": "8:55 a.m." }, { "row": 2027, "column": "act_dep_time", "clean_value": "9:16 a.m." }, { "row": 2027, "column": "sched_arr_time", "clean_value": "11:45 a.m." }, { "row": 2027, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 2028, "column": "act_arr_time", "clean_value": "3:43 p.m." } ], "predicted_repairs": [ { "row": 2025, "column": "act_arr_time", "new_value": "4:24 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 2026, "column": "act_arr_time", "new_value": "7:10 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 2027, "column": "act_arr_time", "new_value": "12:12 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 2028, "column": "act_arr_time", "new_value": "3:36 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":2025,\"column\":\"act_arr_time\",\"new_value\":\"4:24 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":2026,\"column\":\"act_arr_time\",\"new_value\":\"7:10 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":2027,\"column\":\"act_arr_time\",\"new_value\":\"12:12 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":2028,\"column\":\"act_arr_time\",\"new_value\":\"3:36 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 9, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 }, "target_rows": [ { "_row": "657", "index": "658", "id": "685", "beer-name": "Lava Lake Wit", "style": "Witbier", "ounces": "12.0 oz.", "abv": "0.052", "ibu": "15", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "658", "index": "659", "id": "613", "beer-name": "Mountain Livin' Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.06", "ibu": "N/A", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "659", "index": "660", "id": "356", "beer-name": "Crazy Mountain Amber Ale", "style": "American Amber / Red Ale", "ounces": "12.0 ounce", "abv": "0.052", "ibu": "25", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "660", "index": "661", "id": "2029", "beer-name": "Tropicalia", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.065", "ibu": "65", "brewery_id": "247", "brewery-name": "Creature Comforts", "city": "Athens", "state": "GA" } ], "ground_truth": [ { "row": 657, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ibu", "clean_value": "" }, { "row": 659, "column": "ounces", "clean_value": "12" }, { "row": 660, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 657, "column": "abv", "new_value": "0.052", "reason": "The new value for abv is 0.052 which does not exist in the dataset." }, { "row": 658, "column": "abv", "new_value": "0.06", "reason": "The new value for abv is 0.06 which does not exist in the dataset." }, { "row": 659, "column": "abv", "new_value": "0.052", "reason": "The new value for abv is 0.052 which does not exist in the dataset." }, { "row": 660, "column": "abv", "new_value": "0.065", "reason": "The new value for abv is 0.065 which does not exist in the dataset." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":657,\"column\":\"abv\",\"new_value\":\"0.052\",\"reason\":\"The new value for abv is 0.052 which does not exist in the dataset.\"},{\"row\":658,\"column\":\"abv\",\"new_value\":\"0.06\",\"reason\":\"The new value for abv is 0.06 which does not exist in the dataset.\"},{\"row\":659,\"column\":\"abv\",\"new_value\":\"0.052\",\"reason\":\"The new value for abv is 0.052 which does not exist in the dataset.\"},{\"row\":660,\"column\":\"abv\",\"new_value\":\"0.065\",\"reason\":\"The new value for abv is 0.065 which does not exist in the dataset.\"}]}" }, { "task_index": 10, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "122", "index": "123", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-4", "MeasureName": "heart attack patients given smoking cessation advice/counseling", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-4" }, { "_row": "123", "index": "124", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "0%", "Sample": "1 patients", "Stateavg": "al_ami-5" }, { "_row": "124", "index": "125", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "125", "index": "126", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" } ], "ground_truth": [], "predicted_repairs": [ { "row": 122, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." }, { "row": 123, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." }, { "row": 124, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." }, { "row": 125, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":122,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"},{\"row\":123,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"},{\"row\":124,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"},{\"row\":125,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"}]}" }, { "task_index": 11, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 14, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "wrong_value": 4 }, "target_rows": [ { "_row": "1535", "tuple_id": "1536", "src": "flytecomm", "flight": "CO-1193-EWR-MCO", "sched_dep_time": "9:15 a.m.", "act_dep_time": "", "sched_arr_time": "12:18 p.m.", "act_arr_time": "" }, { "_row": "1536", "tuple_id": "1537", "src": "flytecomm", "flight": "AA-3842-MSP-ORD", "sched_dep_time": "", "act_dep_time": "6:57 a.m.", "sched_arr_time": "", "act_arr_time": "7:49 a.m." }, { "_row": "1537", "tuple_id": "1538", "src": "flytecomm", "flight": "AA-643-MIA-ORD", "sched_dep_time": "", "act_dep_time": "7:31 a.m.", "sched_arr_time": "", "act_arr_time": "9:26 a.m." }, { "_row": "1538", "tuple_id": "1539", "src": "flytecomm", "flight": "AA-1007-MIA-PHX", "sched_dep_time": "", "act_dep_time": "5:09 p.m.", "sched_arr_time": "", "act_arr_time": "7:43 p.m." } ], "ground_truth": [ { "row": 1535, "column": "act_dep_time", "clean_value": "9:14 a.m." }, { "row": 1535, "column": "act_arr_time", "clean_value": "12:09 p.m." }, { "row": 1536, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 1536, "column": "act_dep_time", "clean_value": "6:56 a.m." }, { "row": 1536, "column": "sched_arr_time", "clean_value": "7:30 a.m." }, { "row": 1536, "column": "act_arr_time", "clean_value": "7:51 a.m." }, { "row": 1537, "column": "sched_dep_time", "clean_value": "7:10 a.m." }, { "row": 1537, "column": "act_dep_time", "clean_value": "7:30 a.m." }, { "row": 1537, "column": "sched_arr_time", "clean_value": "9:35 a.m." }, { "row": 1537, "column": "act_arr_time", "clean_value": "9:31 a.m." }, { "row": 1538, "column": "sched_dep_time", "clean_value": "4:55 p.m." }, { "row": 1538, "column": "act_dep_time", "clean_value": "5:08 p.m." }, { "row": 1538, "column": "sched_arr_time", "clean_value": "8:05 p.m." }, { "row": 1538, "column": "act_arr_time", "clean_value": "7:55 p.m." } ], "predicted_repairs": [ { "row": 1535, "column": "act_arr_time", "new_value": "7:49 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1536, "column": "act_arr_time", "new_value": "9:26 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1537, "column": "act_arr_time", "new_value": "7:43 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1538, "column": "act_arr_time", "new_value": "7:49 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1535,\"column\":\"act_arr_time\",\"new_value\":\"7:49 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1536,\"column\":\"act_arr_time\",\"new_value\":\"9:26 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1537,\"column\":\"act_arr_time\",\"new_value\":\"7:43 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1538,\"column\":\"act_arr_time\",\"new_value\":\"7:49 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 12, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 4 }, "target_rows": [ { "_row": "1774", "index": "1775", "id": "1841", "beer-name": "Alpha Blackback", "style": "American Black Ale", "ounces": "12.0 oz", "abv": "0.07200000000000001%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1775", "index": "1776", "id": "1782", "beer-name": "Kiss Off IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.063%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1776", "index": "1777", "id": "1552", "beer-name": "Dog Days Summer Ale", "style": "K\u00f6lsch", "ounces": "12.0 oz.", "abv": "0.045%", "ibu": "28", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1777", "index": "1778", "id": "1479", "beer-name": "1881 California Red", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.055999999999999994%", "ibu": "35", "brewery_id": "397", "brewery-name": "Ruhstaller Beer Company", "city": "Sacramento", "state": "CA" } ], "ground_truth": [ { "row": 1774, "column": "ounces", "clean_value": "12" }, { "row": 1774, "column": "abv", "clean_value": "0.072" }, { "row": 1774, "column": "ibu", "clean_value": "" }, { "row": 1775, "column": "ounces", "clean_value": "12" }, { "row": 1775, "column": "abv", "clean_value": "0.063" }, { "row": 1775, "column": "ibu", "clean_value": "" }, { "row": 1776, "column": "ounces", "clean_value": "12" }, { "row": 1776, "column": "abv", "clean_value": "0.045" }, { "row": 1777, "column": "ounces", "clean_value": "12" }, { "row": 1777, "column": "abv", "clean_value": "0.056" } ], "predicted_repairs": [ { "row": 1777, "column": "beer-name", "new_value": "1881 California Red", "reason": "This beer has a different name than the other beers in the contract." }, { "row": 1776, "column": "beer-name", "new_value": "Kiss Off IPA", "reason": "This beer has a different style than the other beers in the contract." }, { "row": 1775, "column": "beer-name", "new_value": "Alpha Blackback", "reason": "This beer has a different brewery name than the other beers in the contract." }, { "row": 1774, "column": "beer-name", "new_value": "Kiss Off IPA", "reason": "This beer has a different style than the other beers in the contract." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1777,\"column\":\"beer-name\",\"new_value\":\"1881 California Red\",\"reason\":\"This beer has a different name than the other beers in the contract.\"},{\"row\":1776,\"column\":\"beer-name\",\"new_value\":\"Kiss Off IPA\",\"reason\":\"This beer has a different style than the other beers in the contract.\"},{\"row\":1775,\"column\":\"beer-name\",\"new_value\":\"Alpha Blackback\",\"reason\":\"This beer has a different brewery name than the other beers in the contract.\"},{\"row\":1774,\"column\":\"beer-name\",\"new_value\":\"Kiss Off IPA\",\"reason\":\"This beer has a different style than the other beers in the contract.\"}]}" }, { "task_index": 13, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 }, "target_rows": [ { "_row": "881", "index": "882", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "82%", "Sample": "11 patients", "Stateavg": "al_ami-5" }, { "_row": "882", "index": "883", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "883", "index": "884", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" }, { "_row": "884", "index": "885", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "xl", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "87%", "Sample": "67 patients", "Stateavg": "al_hf-1" } ], "ground_truth": [ { "row": 881, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 883, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 884, "column": "State", "clean_value": "al" } ], "predicted_repairs": [ { "row": 881, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." }, { "row": 882, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." }, { "row": 883, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." }, { "row": 884, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":881,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"},{\"row\":882,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"},{\"row\":883,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"},{\"row\":884,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"}]}" }, { "task_index": 14, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 4 }, "target_rows": [ { "_row": "1675", "tuple_id": "1676", "src": "wunderground", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:45 a.m.", "sched_arr_time": "4:37 p.m.", "act_arr_time": "4:57 p.m." }, { "_row": "1676", "tuple_id": "1677", "src": "wunderground", "flight": "AA-2957-DFW-CVG", "sched_dep_time": "7:55 a.m.", "act_dep_time": "8:05 a.m.", "sched_arr_time": "10:55 a.m.", "act_arr_time": "10:58 a.m." }, { "_row": "1677", "tuple_id": "1678", "src": "wunderground", "flight": "AA-1664-MIA-ATL", "sched_dep_time": "10:15 a.m.", "act_dep_time": "10:19 a.m.", "sched_arr_time": "11:43 a.m.", "act_arr_time": "11:50 a.m." }, { "_row": "1678", "tuple_id": "1679", "src": "wunderground", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "7:50 a.m.", "act_arr_time": "7:59 a.m." } ], "ground_truth": [ { "row": 1675, "column": "act_dep_time", "clean_value": "11:30 a.m." }, { "row": 1675, "column": "sched_arr_time", "clean_value": "4:57 p.m." }, { "row": 1675, "column": "act_arr_time", "clean_value": "5:05 p.m." }, { "row": 1676, "column": "act_dep_time", "clean_value": "8:04 a.m." }, { "row": 1676, "column": "sched_arr_time", "clean_value": "11:05 a.m." }, { "row": 1676, "column": "act_arr_time", "clean_value": "11:01 a.m." }, { "row": 1677, "column": "act_dep_time", "clean_value": "10:18 a.m." }, { "row": 1677, "column": "sched_arr_time", "clean_value": "12:10 p.m." }, { "row": 1677, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 1678, "column": "sched_arr_time", "clean_value": "8:00 a.m." }, { "row": 1678, "column": "act_arr_time", "clean_value": "8:06 a.m." } ], "predicted_repairs": [ { "row": 1675, "column": "act_arr_time", "new_value": "4:57 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1676, "column": "act_arr_time", "new_value": "10:58 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1677, "column": "act_arr_time", "new_value": "11:50 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1678, "column": "act_arr_time", "new_value": "7:59 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1675,\"column\":\"act_arr_time\",\"new_value\":\"4:57 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1676,\"column\":\"act_arr_time\",\"new_value\":\"10:58 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1677,\"column\":\"act_arr_time\",\"new_value\":\"11:50 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1678,\"column\":\"act_arr_time\",\"new_value\":\"7:59 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 15, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "1813", "index": "1814", "id": "307", "beer-name": "Santa Fe Oktoberfest", "style": "M\u00e4rzen / Oktoberfest", "ounces": "12.0 oz.", "abv": "", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1814", "index": "1815", "id": "305", "beer-name": "Imperial Java Stout", "style": "Russian Imperial Stout", "ounces": "12.0 oz.", "abv": "0.08%", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1815", "index": "1816", "id": "304", "beer-name": "Freestyle Pilsner", "style": "German Pilsener", "ounces": "12.0 oz.", "abv": "0.055", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1816", "index": "1817", "id": "217", "beer-name": "Happy Camper IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.066", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" } ], "ground_truth": [ { "row": 1813, "column": "ounces", "clean_value": "12" }, { "row": 1813, "column": "ibu", "clean_value": "" }, { "row": 1814, "column": "ounces", "clean_value": "12" }, { "row": 1814, "column": "abv", "clean_value": "0.08" }, { "row": 1814, "column": "ibu", "clean_value": "" }, { "row": 1815, "column": "ounces", "clean_value": "12" }, { "row": 1815, "column": "ibu", "clean_value": "" }, { "row": 1816, "column": "ounces", "clean_value": "12" }, { "row": 1816, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1813, "column": "abv", "new_value": "0.08%", "reason": "The new value for abv is incorrect." }, { "row": 1814, "column": "abv", "new_value": "0.055", "reason": "The new value for abv is incorrect." }, { "row": 1815, "column": "abv", "new_value": "0.066", "reason": "The new value for abv is incorrect." }, { "row": 1816, "column": "abv", "new_value": "0.08%", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1813,\"column\":\"abv\",\"new_value\":\"0.08%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1814,\"column\":\"abv\",\"new_value\":\"0.055\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1815,\"column\":\"abv\",\"new_value\":\"0.066\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1816,\"column\":\"abv\",\"new_value\":\"0.08%\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 16, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 }, "target_rows": [ { "_row": "734", "index": "735", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "99%", "Sample": "411 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "735", "index": "736", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scix-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "98%", "Sample": "417 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "736", "index": "737", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912xalabamaxhighwayx157", "Address2": "empty", "Address3": "empty", "City": "cuxxman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "98%", "Sample": "405 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "737", "index": "738", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 735, "column": "MeasureCode", "clean_value": "scip-inf-2" }, { "row": 736, "column": "Address1", "clean_value": "1912 alabama highway 157" }, { "row": 736, "column": "City", "clean_value": "cullman" } ], "predicted_repairs": [ { "row": 734, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 735, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 736, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 737, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":734,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"},{\"row\":735,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"},{\"row\":736,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"},{\"row\":737,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"}]}" }, { "task_index": 17, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 3, "wrong_cell": 1 }, "target_rows": [ { "_row": "167", "tuple_id": "168", "src": "boston", "flight": "UA-3515-IAD-MSP", "sched_dep_time": "", "act_dep_time": "8:26 a.m.", "sched_arr_time": "", "act_arr_time": "9:54 a.m." }, { "_row": "168", "tuple_id": "169", "src": "boston", "flight": "AA-3468-CVG-MIA", "sched_dep_time": "7:00 a.m.", "act_dep_time": "7:25 a.m.", "sched_arr_time": "9:55 a.m.", "act_arr_time": "9:42 a.m." }, { "_row": "169", "tuple_id": "170", "src": "boston", "flight": "AA-484-DFW-MIA", "sched_dep_time": "4:15 p.m.", "act_dep_time": "4:30 p.m.", "sched_arr_time": "7:55 p.m.", "act_arr_time": "7:35 p.m." }, { "_row": "170", "tuple_id": "171", "src": "boston", "flight": "AA-1886-BOS-MIA", "sched_dep_time": "", "act_dep_time": "10:55 a.m.", "sched_arr_time": "", "act_arr_time": "1:34 p.m." } ], "ground_truth": [ { "row": 167, "column": "sched_dep_time", "clean_value": "8:15 a.m." }, { "row": 167, "column": "act_dep_time", "clean_value": "8:12 a.m." }, { "row": 167, "column": "sched_arr_time", "clean_value": "10:06 a.m." }, { "row": 167, "column": "act_arr_time", "clean_value": "9:56 a.m." }, { "row": 168, "column": "act_arr_time", "clean_value": "9:45 a.m." }, { "row": 169, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 169, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 170, "column": "sched_dep_time", "clean_value": "10:45 a.m." }, { "row": 170, "column": "sched_arr_time", "clean_value": "2:20 p.m." }, { "row": 170, "column": "act_arr_time", "clean_value": "1:40 p.m." } ], "predicted_repairs": [ { "row": 170, "column": "flight", "new_value": "AA-1886-BOS-MIA", "reason": "The flight AA-1886-BOS-MIA is not listed in the contract version." }, { "row": 167, "column": "flight", "new_value": "UA-3515-IAD-MSP", "reason": "The flight UA-3515-IAD-MSP is not listed in the contract version." }, { "row": 169, "column": "flight", "new_value": "AA-484-DFW-MIA", "reason": "The flight AA-484-DFW-MIA is not listed in the contract version." }, { "row": 171, "column": "flight", "new_value": "NA", "reason": "No flights are listed in the contract version." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":170,\"column\":\"flight\",\"new_value\":\"AA-1886-BOS-MIA\",\"reason\":\"The flight AA-1886-BOS-MIA is not listed in the contract version.\"},{\"row\":167,\"column\":\"flight\",\"new_value\":\"UA-3515-IAD-MSP\",\"reason\":\"The flight UA-3515-IAD-MSP is not listed in the contract version.\"},{\"row\":169,\"column\":\"flight\",\"new_value\":\"AA-484-DFW-MIA\",\"reason\":\"The flight AA-484-DFW-MIA is not listed in the contract version.\"},{\"row\":171,\"column\":\"flight\",\"new_value\":\"NA\",\"reason\":\"No flights are listed in the contract version.\"}]}" }, { "task_index": 18, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 1 }, "target_rows": [ { "_row": "1589", "index": "1590", "id": "785", "beer-name": "Old Chub (2003)", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1590", "index": "1591", "id": "745", "beer-name": "Dale's Pale Ale (2008)", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1591", "index": "1592", "id": "744", "beer-name": "Dale's Pale Ale (2006)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.065%", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons CO", "state": "" }, { "_row": "1592", "index": "1593", "id": "743", "beer-name": "Dale's Pale Ale (2004)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" } ], "ground_truth": [ { "row": 1589, "column": "ounces", "clean_value": "12" }, { "row": 1590, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "abv", "clean_value": "0.065" }, { "row": 1591, "column": "city", "clean_value": "Lyons" }, { "row": 1591, "column": "state", "clean_value": "CO" }, { "row": 1592, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1592, "column": "style", "new_value": "Scottish Ale", "reason": "The beer name has been changed to 'Scottish Ale' which is a different style than the original 'Scottish Ale'." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1592,\"column\":\"style\",\"new_value\":\"Scottish Ale\",\"reason\":\"The beer name has been changed to 'Scottish Ale' which is a different style than the original 'Scottish Ale'.\"}]}" }, { "task_index": 19, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 }, "target_rows": [ { "_row": "512", "index": "513", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "513", "index": "514", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "chxrokxx", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "100%", "Sample": "6 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "514", "index": "515", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "1xx%", "Sample": "5 patients", "Stateavg": "al_scip-vte-1" }, { "_row": "515", "index": "516", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-2", "MeasureName": "patients who got treatment at the right time (within 24 hours before or after their surgery) to help prevent blood clots after certain types of surgery", "Score": "100%", "Sample": "5 patients", "Stateavg": "al_scip-vte-2" } ], "ground_truth": [ { "row": 513, "column": "CountyName", "clean_value": "cherokee" }, { "row": 514, "column": "Score", "clean_value": "100%" } ], "predicted_repairs": [ { "row": 512, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." }, { "row": 513, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." }, { "row": 514, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." }, { "row": 515, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":512,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"},{\"row\":513,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"},{\"row\":514,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"},{\"row\":515,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"}]}" }, { "task_index": 20, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "13", "tuple_id": "14", "src": "aa", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "8:00 a.m.", "act_arr_time": "8:06 a.m." }, { "_row": "14", "tuple_id": "15", "src": "aa", "flight": "AA-1279-DFW-PHX", "sched_dep_time": "1:00 p.m.", "act_dep_time": "2:04 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:30 p.m." }, { "_row": "15", "tuple_id": "16", "src": "aa", "flight": "AA-616-DFW-DTW", "sched_dep_time": "9:05 a.m.", "act_dep_time": "10:10 a.m.", "sched_arr_time": "12:35 p.m.", "act_arr_time": "1:27 p.m." }, { "_row": "16", "tuple_id": "17", "src": "aa", "flight": "AA-4344-ORD-DTW", "sched_dep_time": "11:45 a.m.", "act_dep_time": "12:13 p.m.", "sched_arr_time": "2:00 p.m.", "act_arr_time": "2:10 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 13, "column": "act_arr_time", "new_value": "8:06 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 14, "column": "act_arr_time", "new_value": "3:30 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 15, "column": "act_arr_time", "new_value": "1:27 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 16, "column": "act_arr_time", "new_value": "2:10 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":13,\"column\":\"act_arr_time\",\"new_value\":\"8:06 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":14,\"column\":\"act_arr_time\",\"new_value\":\"3:30 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":15,\"column\":\"act_arr_time\",\"new_value\":\"1:27 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":16,\"column\":\"act_arr_time\",\"new_value\":\"2:10 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 21, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 2, "wrong_value": 2 }, "target_rows": [ { "_row": "662", "index": "663", "id": "2293", "beer-name": "Aviator Raspberry Blonde", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.049%", "ibu": "25", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "663", "index": "664", "id": "1105", "beer-name": "3 Picket Porter", "style": "American Porter", "ounces": "12.0 oz.", "abv": "0.055%", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "664", "index": "665", "id": "1104", "beer-name": "Rusty Nail Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.056", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "665", "index": "666", "id": "2145", "beer-name": "Red Water Irish Style Red", "style": "American Amber / Red Ale", "ounces": "12.0 OZ.", "abv": "0.065", "ibu": "N/A", "brewery_id": "212", "brewery-name": "Crow Peak Brewing Company", "city": "Spearfish", "state": "SD" } ], "ground_truth": [ { "row": 662, "column": "ounces", "clean_value": "12" }, { "row": 662, "column": "abv", "clean_value": "0.049" }, { "row": 663, "column": "ounces", "clean_value": "12" }, { "row": 663, "column": "abv", "clean_value": "0.055" }, { "row": 663, "column": "ibu", "clean_value": "" }, { "row": 664, "column": "ounces", "clean_value": "12" }, { "row": 664, "column": "ibu", "clean_value": "" }, { "row": 665, "column": "ounces", "clean_value": "12" }, { "row": 665, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 662, "column": "abv", "new_value": "0.049%", "reason": "The new value for Abv is incorrect." }, { "row": 663, "column": "abv", "new_value": "0.055%", "reason": "The new value for Abv is incorrect." }, { "row": 664, "column": "abv", "new_value": "0.056%", "reason": "The new value for Abv is incorrect." }, { "row": 665, "column": "abv", "new_value": "0.065%", "reason": "The new value for Abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":662,\"column\":\"abv\",\"new_value\":\"0.049%\",\"reason\":\"The new value for Abv is incorrect.\"},{\"row\":663,\"column\":\"abv\",\"new_value\":\"0.055%\",\"reason\":\"The new value for Abv is incorrect.\"},{\"row\":664,\"column\":\"abv\",\"new_value\":\"0.056%\",\"reason\":\"The new value for Abv is incorrect.\"},{\"row\":665,\"column\":\"abv\",\"new_value\":\"0.065%\",\"reason\":\"The new value for Abv is incorrect.\"}]}" }, { "task_index": 22, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 }, "target_rows": [ { "_row": "870", "index": "871", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "80%", "Sample": "15 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "871", "index": "872", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "87%", "Sample": "15 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "872", "index": "873", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntaxy non-pxofit - pxivate", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "87%", "Sample": "15 patiexts", "Stateavg": "al_scip-inf-3" }, { "_row": "873", "index": "874", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 872, "column": "HospitalOwner", "clean_value": "voluntary non-profit - private" }, { "row": 872, "column": "Sample", "clean_value": "15 patients" } ], "predicted_repairs": [ { "row": 870, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." }, { "row": 871, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." }, { "row": 872, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." }, { "row": 873, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":870,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"},{\"row\":871,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"},{\"row\":872,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"},{\"row\":873,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"}]}" }, { "task_index": 23, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 4 }, "target_rows": [ { "_row": "324", "tuple_id": "325", "src": "weather", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:20 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "2:49 p.m." }, { "_row": "325", "tuple_id": "326", "src": "weather", "flight": "UA-854-SFO-IAH", "sched_dep_time": "7:53 a.m.", "act_dep_time": "8:07 a.m.", "sched_arr_time": "1:39 p.m.", "act_arr_time": "1:23 p.m." }, { "_row": "326", "tuple_id": "327", "src": "weather", "flight": "AA-415-BOS-ORD", "sched_dep_time": "8:35 a.m.", "act_dep_time": "", "sched_arr_time": "10:40 a.m.", "act_arr_time": "" }, { "_row": "327", "tuple_id": "328", "src": "weather", "flight": "AA-85-JFK-SFO", "sched_dep_time": "3:05 p.m.", "act_dep_time": "", "sched_arr_time": "6:30 p.m.", "act_arr_time": "" } ], "ground_truth": [ { "row": 324, "column": "act_dep_time", "clean_value": "1:19 p.m." }, { "row": 324, "column": "act_arr_time", "clean_value": "3:13 p.m." }, { "row": 325, "column": "act_dep_time", "clean_value": "7:49 a.m." }, { "row": 325, "column": "act_arr_time", "clean_value": "1:30 p.m." }, { "row": 326, "column": "act_dep_time", "clean_value": "8:56 a.m." }, { "row": 326, "column": "act_arr_time", "clean_value": "10:16 a.m." }, { "row": 327, "column": "act_dep_time", "clean_value": "3:36 p.m." }, { "row": 327, "column": "act_arr_time", "clean_value": "6:43 p.m." } ], "predicted_repairs": [ { "row": 324, "column": "act_arr_time", "new_value": "2:49 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 325, "column": "act_arr_time", "new_value": "1:23 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 326, "column": "act_arr_time", "new_value": "10:40 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 327, "column": "act_arr_time", "new_value": "", "reason": "The new value for act_arr_time is empty." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":324,\"column\":\"act_arr_time\",\"new_value\":\"2:49 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":325,\"column\":\"act_arr_time\",\"new_value\":\"1:23 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":326,\"column\":\"act_arr_time\",\"new_value\":\"10:40 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":327,\"column\":\"act_arr_time\",\"new_value\":\"\",\"reason\":\"The new value for act_arr_time is empty.\"}]}" }, { "task_index": 24, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "1597", "index": "1598", "id": "1533", "beer-name": "G'KNIGHT", "style": "American Double / Imperial IPA", "ounces": "12.0 OZ.", "abv": "0.087%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1598", "index": "1599", "id": "1532", "beer-name": "Ten Fidy", "style": "Russian Imperial Stout", "ounces": "12.0 oz", "abv": "0.099%", "ibu": "98", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1599", "index": "1600", "id": "1328", "beer-name": "Deviant Dale's IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.08%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1600", "index": "1601", "id": "1175", "beer-name": "Old Chub", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" } ], "ground_truth": [ { "row": 1597, "column": "ounces", "clean_value": "12" }, { "row": 1597, "column": "abv", "clean_value": "0.087" }, { "row": 1598, "column": "ounces", "clean_value": "12" }, { "row": 1598, "column": "abv", "clean_value": "0.099" }, { "row": 1599, "column": "ounces", "clean_value": "16" }, { "row": 1599, "column": "abv", "clean_value": "0.08" }, { "row": 1600, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1597, "column": "abv", "new_value": "0.087%", "reason": "The new value for abv is incorrect." }, { "row": 1598, "column": "abv", "new_value": "0.099%", "reason": "The new value for abv is incorrect." }, { "row": 1599, "column": "abv", "new_value": "0.08%", "reason": "The new value for abv is incorrect." }, { "row": 1600, "column": "abv", "new_value": "0.08", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1597,\"column\":\"abv\",\"new_value\":\"0.087%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1598,\"column\":\"abv\",\"new_value\":\"0.099%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1599,\"column\":\"abv\",\"new_value\":\"0.08%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1600,\"column\":\"abv\",\"new_value\":\"0.08\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 25, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "661", "index": "662", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-3" }, { "_row": "662", "index": "663", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-4" }, { "_row": "663", "index": "664", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-6" }, { "_row": "664", "index": "665", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [], "predicted_repairs": [ { "row": 661, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." }, { "row": 662, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." }, { "row": 663, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." }, { "row": 664, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":661,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"},{\"row\":662,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"},{\"row\":663,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"},{\"row\":664,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"}]}" } ], "failure_samples_by_slice": { "deterministic_normalization": [ { "task_index": 3, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "1363", "index": "1364", "id": "2358", "beer-name": "Minhas Light (2012)", "style": "Light Lager", "ounces": "12.0 oz.", "abv": "0.04", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1364", "index": "1365", "id": "2282", "beer-name": "Huber", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "0.05%", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1365", "index": "1366", "id": "2281", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "16.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" }, { "_row": "1366", "index": "1367", "id": "2280", "beer-name": "Clear Creek Ice", "style": "American Pale Lager", "ounces": "12.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "134", "brewery-name": "Minhas Craft Brewery", "city": "Monroe", "state": "WI" } ], "ground_truth": [ { "row": 1363, "column": "ounces", "clean_value": "12" }, { "row": 1363, "column": "ibu", "clean_value": "" }, { "row": 1364, "column": "ounces", "clean_value": "12" }, { "row": 1364, "column": "abv", "clean_value": "0.05" }, { "row": 1364, "column": "ibu", "clean_value": "" }, { "row": 1365, "column": "ounces", "clean_value": "16" }, { "row": 1365, "column": "ibu", "clean_value": "" }, { "row": 1366, "column": "ounces", "clean_value": "12" }, { "row": 1366, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1363, "column": "abv", "new_value": "0.04", "reason": "The new value for abv is 0.04 instead of the expected 0.05." }, { "row": 1364, "column": "abv", "new_value": "0.05%", "reason": "The new value for abv is 0.05% instead of the expected 0.04." }, { "row": 1365, "column": "abv", "new_value": "0.062", "reason": "The new value for abv is 0.062 instead of the expected 0.05." }, { "row": 1366, "column": "abv", "new_value": "0.062", "reason": "The new value for abv is 0.062 instead of the expected 0.05." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1363,\"column\":\"abv\",\"new_value\":\"0.04\",\"reason\":\"The new value for abv is 0.04 instead of the expected 0.05.\"},{\"row\":1364,\"column\":\"abv\",\"new_value\":\"0.05%\",\"reason\":\"The new value for abv is 0.05% instead of the expected 0.04.\"},{\"row\":1365,\"column\":\"abv\",\"new_value\":\"0.062\",\"reason\":\"The new value for abv is 0.062 instead of the expected 0.05.\"},{\"row\":1366,\"column\":\"abv\",\"new_value\":\"0.062\",\"reason\":\"The new value for abv is 0.062 instead of the expected 0.05.\"}]}" }, { "task_index": 6, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "1840", "index": "1841", "id": "1539", "beer-name": "Monkey Fist IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.069%", "ibu": "65", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1841", "index": "1842", "id": "975", "beer-name": "Shipyard Summer Ale", "style": "American Pale Wheat Ale", "ounces": "12.0 oz", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1842", "index": "1843", "id": "814", "beer-name": "Pumpkinhead Ale", "style": "Pumpkin Ale", "ounces": "12.0 oz.", "abv": "0.047", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" }, { "_row": "1843", "index": "1844", "id": "727", "beer-name": "Shipyard Export", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.051", "ibu": "N/A", "brewery_id": "385", "brewery-name": "Shipyard Brewing Company", "city": "Portland", "state": "ME" } ], "ground_truth": [ { "row": 1840, "column": "ounces", "clean_value": "12" }, { "row": 1840, "column": "abv", "clean_value": "0.069" }, { "row": 1841, "column": "ounces", "clean_value": "12" }, { "row": 1841, "column": "ibu", "clean_value": "" }, { "row": 1842, "column": "ounces", "clean_value": "12" }, { "row": 1842, "column": "ibu", "clean_value": "" }, { "row": 1843, "column": "ounces", "clean_value": "12" }, { "row": 1843, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1840, "column": "abv", "new_value": "0.069%", "reason": "The new value for abv is incorrect." }, { "row": 1841, "column": "ibu", "new_value": "65", "reason": "The new value for ibu is incorrect." }, { "row": 1842, "column": "style", "new_value": "American IPA", "reason": "The new value for style is incorrect." }, { "row": 1843, "column": "ibu", "new_value": "N/A", "reason": "The new value for ibu is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1840,\"column\":\"abv\",\"new_value\":\"0.069%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1841,\"column\":\"ibu\",\"new_value\":\"65\",\"reason\":\"The new value for ibu is incorrect.\"},{\"row\":1842,\"column\":\"style\",\"new_value\":\"American IPA\",\"reason\":\"The new value for style is incorrect.\"},{\"row\":1843,\"column\":\"ibu\",\"new_value\":\"N/A\",\"reason\":\"The new value for ibu is incorrect.\"}]}" }, { "task_index": 9, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 4 }, "target_rows": [ { "_row": "657", "index": "658", "id": "685", "beer-name": "Lava Lake Wit", "style": "Witbier", "ounces": "12.0 oz.", "abv": "0.052", "ibu": "15", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "658", "index": "659", "id": "613", "beer-name": "Mountain Livin' Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.06", "ibu": "N/A", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "659", "index": "660", "id": "356", "beer-name": "Crazy Mountain Amber Ale", "style": "American Amber / Red Ale", "ounces": "12.0 ounce", "abv": "0.052", "ibu": "25", "brewery_id": "63", "brewery-name": "Crazy Mountain Brewing Company", "city": "Edwards", "state": "CO" }, { "_row": "660", "index": "661", "id": "2029", "beer-name": "Tropicalia", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.065", "ibu": "65", "brewery_id": "247", "brewery-name": "Creature Comforts", "city": "Athens", "state": "GA" } ], "ground_truth": [ { "row": 657, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ounces", "clean_value": "12" }, { "row": 658, "column": "ibu", "clean_value": "" }, { "row": 659, "column": "ounces", "clean_value": "12" }, { "row": 660, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 657, "column": "abv", "new_value": "0.052", "reason": "The new value for abv is 0.052 which does not exist in the dataset." }, { "row": 658, "column": "abv", "new_value": "0.06", "reason": "The new value for abv is 0.06 which does not exist in the dataset." }, { "row": 659, "column": "abv", "new_value": "0.052", "reason": "The new value for abv is 0.052 which does not exist in the dataset." }, { "row": 660, "column": "abv", "new_value": "0.065", "reason": "The new value for abv is 0.065 which does not exist in the dataset." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":657,\"column\":\"abv\",\"new_value\":\"0.052\",\"reason\":\"The new value for abv is 0.052 which does not exist in the dataset.\"},{\"row\":658,\"column\":\"abv\",\"new_value\":\"0.06\",\"reason\":\"The new value for abv is 0.06 which does not exist in the dataset.\"},{\"row\":659,\"column\":\"abv\",\"new_value\":\"0.052\",\"reason\":\"The new value for abv is 0.052 which does not exist in the dataset.\"},{\"row\":660,\"column\":\"abv\",\"new_value\":\"0.065\",\"reason\":\"The new value for abv is 0.065 which does not exist in the dataset.\"}]}" }, { "task_index": 15, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "1813", "index": "1814", "id": "307", "beer-name": "Santa Fe Oktoberfest", "style": "M\u00e4rzen / Oktoberfest", "ounces": "12.0 oz.", "abv": "", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1814", "index": "1815", "id": "305", "beer-name": "Imperial Java Stout", "style": "Russian Imperial Stout", "ounces": "12.0 oz.", "abv": "0.08%", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1815", "index": "1816", "id": "304", "beer-name": "Freestyle Pilsner", "style": "German Pilsener", "ounces": "12.0 oz.", "abv": "0.055", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" }, { "_row": "1816", "index": "1817", "id": "217", "beer-name": "Happy Camper IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.066", "ibu": "N/A", "brewery_id": "392", "brewery-name": "Santa Fe Brewing Company", "city": "Santa Fe", "state": "NM" } ], "ground_truth": [ { "row": 1813, "column": "ounces", "clean_value": "12" }, { "row": 1813, "column": "ibu", "clean_value": "" }, { "row": 1814, "column": "ounces", "clean_value": "12" }, { "row": 1814, "column": "abv", "clean_value": "0.08" }, { "row": 1814, "column": "ibu", "clean_value": "" }, { "row": 1815, "column": "ounces", "clean_value": "12" }, { "row": 1815, "column": "ibu", "clean_value": "" }, { "row": 1816, "column": "ounces", "clean_value": "12" }, { "row": 1816, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1813, "column": "abv", "new_value": "0.08%", "reason": "The new value for abv is incorrect." }, { "row": 1814, "column": "abv", "new_value": "0.055", "reason": "The new value for abv is incorrect." }, { "row": 1815, "column": "abv", "new_value": "0.066", "reason": "The new value for abv is incorrect." }, { "row": 1816, "column": "abv", "new_value": "0.08%", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1813,\"column\":\"abv\",\"new_value\":\"0.08%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1814,\"column\":\"abv\",\"new_value\":\"0.055\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1815,\"column\":\"abv\",\"new_value\":\"0.066\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1816,\"column\":\"abv\",\"new_value\":\"0.08%\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 21, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 2, "wrong_value": 2 }, "target_rows": [ { "_row": "662", "index": "663", "id": "2293", "beer-name": "Aviator Raspberry Blonde", "style": "American Blonde Ale", "ounces": "12.0 oz.", "abv": "0.049%", "ibu": "25", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "663", "index": "664", "id": "1105", "beer-name": "3 Picket Porter", "style": "American Porter", "ounces": "12.0 oz.", "abv": "0.055%", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "664", "index": "665", "id": "1104", "beer-name": "Rusty Nail Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.056", "ibu": "N/A", "brewery_id": "169", "brewery-name": "Crooked Fence Brewing Company", "city": "Garden City", "state": "ID" }, { "_row": "665", "index": "666", "id": "2145", "beer-name": "Red Water Irish Style Red", "style": "American Amber / Red Ale", "ounces": "12.0 OZ.", "abv": "0.065", "ibu": "N/A", "brewery_id": "212", "brewery-name": "Crow Peak Brewing Company", "city": "Spearfish", "state": "SD" } ], "ground_truth": [ { "row": 662, "column": "ounces", "clean_value": "12" }, { "row": 662, "column": "abv", "clean_value": "0.049" }, { "row": 663, "column": "ounces", "clean_value": "12" }, { "row": 663, "column": "abv", "clean_value": "0.055" }, { "row": 663, "column": "ibu", "clean_value": "" }, { "row": 664, "column": "ounces", "clean_value": "12" }, { "row": 664, "column": "ibu", "clean_value": "" }, { "row": 665, "column": "ounces", "clean_value": "12" }, { "row": 665, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 662, "column": "abv", "new_value": "0.049%", "reason": "The new value for Abv is incorrect." }, { "row": 663, "column": "abv", "new_value": "0.055%", "reason": "The new value for Abv is incorrect." }, { "row": 664, "column": "abv", "new_value": "0.056%", "reason": "The new value for Abv is incorrect." }, { "row": 665, "column": "abv", "new_value": "0.065%", "reason": "The new value for Abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":662,\"column\":\"abv\",\"new_value\":\"0.049%\",\"reason\":\"The new value for Abv is incorrect.\"},{\"row\":663,\"column\":\"abv\",\"new_value\":\"0.055%\",\"reason\":\"The new value for Abv is incorrect.\"},{\"row\":664,\"column\":\"abv\",\"new_value\":\"0.056%\",\"reason\":\"The new value for Abv is incorrect.\"},{\"row\":665,\"column\":\"abv\",\"new_value\":\"0.065%\",\"reason\":\"The new value for Abv is incorrect.\"}]}" }, { "task_index": 24, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "1597", "index": "1598", "id": "1533", "beer-name": "G'KNIGHT", "style": "American Double / Imperial IPA", "ounces": "12.0 OZ.", "abv": "0.087%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1598", "index": "1599", "id": "1532", "beer-name": "Ten Fidy", "style": "Russian Imperial Stout", "ounces": "12.0 oz", "abv": "0.099%", "ibu": "98", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1599", "index": "1600", "id": "1328", "beer-name": "Deviant Dale's IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.08%", "ibu": "85", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" }, { "_row": "1600", "index": "1601", "id": "1175", "beer-name": "Old Chub", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "389", "brewery-name": "Oskar Blues Brewery (North Carol...", "city": "Brevard", "state": "NC" } ], "ground_truth": [ { "row": 1597, "column": "ounces", "clean_value": "12" }, { "row": 1597, "column": "abv", "clean_value": "0.087" }, { "row": 1598, "column": "ounces", "clean_value": "12" }, { "row": 1598, "column": "abv", "clean_value": "0.099" }, { "row": 1599, "column": "ounces", "clean_value": "16" }, { "row": 1599, "column": "abv", "clean_value": "0.08" }, { "row": 1600, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1597, "column": "abv", "new_value": "0.087%", "reason": "The new value for abv is incorrect." }, { "row": 1598, "column": "abv", "new_value": "0.099%", "reason": "The new value for abv is incorrect." }, { "row": 1599, "column": "abv", "new_value": "0.08%", "reason": "The new value for abv is incorrect." }, { "row": 1600, "column": "abv", "new_value": "0.08", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1597,\"column\":\"abv\",\"new_value\":\"0.087%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1598,\"column\":\"abv\",\"new_value\":\"0.099%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1599,\"column\":\"abv\",\"new_value\":\"0.08%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1600,\"column\":\"abv\",\"new_value\":\"0.08\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 30, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "374", "index": "375", "id": "1288", "beer-name": "Bozone Hefe Weizen", "style": "Hefeweizen", "ounces": "12.0 oz.", "abv": "0.06", "ibu": "25", "brewery_id": "219", "brewery-name": "Bozeman Brewing Company", "city": "Bozeman", "state": "MT" }, { "_row": "375", "index": "376", "id": "470", "beer-name": "Bozone Select Amber Ale", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.055%", "ibu": "N/A", "brewery_id": "219", "brewery-name": "Bozeman Brewing Company", "city": "Bozeman", "state": "MT" }, { "_row": "376", "index": "377", "id": "2167", "beer-name": "Evil Owl", "style": "American Amber / Red Ale", "ounces": "12.0 oz. Alumi-Tek", "abv": "0.052", "ibu": "40", "brewery_id": "207", "brewery-name": "Branchline Brewing Company", "city": "San Antonio", "state": "TX" }, { "_row": "377", "index": "378", "id": "2204", "beer-name": "Post Time K\u00f6lsch", "style": "K\u00f6lsch", "ounces": "16.0 oz", "abv": "0.05", "ibu": "N/A", "brewery_id": "195", "brewery-name": "Breakside Brewery", "city": "Portland", "state": "OR" } ], "ground_truth": [ { "row": 374, "column": "ounces", "clean_value": "12" }, { "row": 375, "column": "ounces", "clean_value": "12" }, { "row": 375, "column": "abv", "clean_value": "0.055" }, { "row": 375, "column": "ibu", "clean_value": "" }, { "row": 376, "column": "ounces", "clean_value": "12" }, { "row": 377, "column": "ounces", "clean_value": "16" }, { "row": 377, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 374, "column": "abv", "new_value": "0.06", "reason": "The new value for abv is 0.06 instead of the expected 0.06." }, { "row": 375, "column": "abv", "new_value": "0.055%", "reason": "The new value for abv is 0.055% instead of the expected 0.055%." }, { "row": 376, "column": "abv", "new_value": "0.052", "reason": "The new value for abv is 0.052 instead of the expected 0.052." }, { "row": 377, "column": "abv", "new_value": "0.05", "reason": "The new value for abv is 0.05 instead of the expected 0.05." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":374,\"column\":\"abv\",\"new_value\":\"0.06\",\"reason\":\"The new value for abv is 0.06 instead of the expected 0.06.\"},{\"row\":375,\"column\":\"abv\",\"new_value\":\"0.055%\",\"reason\":\"The new value for abv is 0.055% instead of the expected 0.055%.\"},{\"row\":376,\"column\":\"abv\",\"new_value\":\"0.052\",\"reason\":\"The new value for abv is 0.052 instead of the expected 0.052.\"},{\"row\":377,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The new value for abv is 0.05 instead of the expected 0.05.\"}]}" }, { "task_index": 36, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 }, "target_rows": [ { "_row": "2211", "index": "2212", "id": "114", "beer-name": "Triangle White Ale", "style": "Witbier", "ounces": "12.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "524", "brewery-name": "Triangle Brewing Company", "city": "Durham", "state": "NC" }, { "_row": "2212", "index": "2213", "id": "113", "beer-name": "Triangle Belgian Golden Ale", "style": "Belgian Strong Pale Ale", "ounces": "12.0 ounce", "abv": "0.08%", "ibu": "N/A", "brewery_id": "524", "brewery-name": "Triangle Brewing Company", "city": "Durham", "state": "NC" }, { "_row": "2213", "index": "2214", "id": "2445", "beer-name": "Troegenator", "style": "Doppelbock", "ounces": "16.0 ounce", "abv": "0.082", "ibu": "N/A", "brewery_id": "97", "brewery-name": "Tr\u00f6egs Brewing Company", "city": "Hershey", "state": "PA" }, { "_row": "2214", "index": "2215", "id": "2444", "beer-name": "Nugget Nectar", "style": "American Amber / Red Ale", "ounces": "16.0 ounce", "abv": "0.075", "ibu": "93", "brewery_id": "97", "brewery-name": "Tr\u00f6egs Brewing Company", "city": "Hershey", "state": "PA" } ], "ground_truth": [ { "row": 2211, "column": "ounces", "clean_value": "12" }, { "row": 2211, "column": "ibu", "clean_value": "" }, { "row": 2212, "column": "ounces", "clean_value": "12" }, { "row": 2212, "column": "abv", "clean_value": "0.08" }, { "row": 2212, "column": "ibu", "clean_value": "" }, { "row": 2213, "column": "ounces", "clean_value": "16" }, { "row": 2213, "column": "ibu", "clean_value": "" }, { "row": 2214, "column": "ounces", "clean_value": "16" } ], "predicted_repairs": [ { "row": 2211, "column": "beer-name", "new_value": "Triangle White Ale", "reason": "The beer name has been changed to 'Triangle White Ale'." }, { "row": 2212, "column": "beer-name", "new_value": "Triangle Belgian Golden Ale", "reason": "The beer name has been changed to 'Triangle Belgian Golden Ale'." }, { "row": 2213, "column": "beer-name", "new_value": "Troegenator", "reason": "The beer name has been changed to 'Troegenator'." }, { "row": 2214, "column": "beer-name", "new_value": "Nugget Nectar", "reason": "The beer name has been changed to 'Nugget Nectar'." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":2211,\"column\":\"beer-name\",\"new_value\":\"Triangle White Ale\",\"reason\":\"The beer name has been changed to 'Triangle White Ale'.\"},{\"row\":2212,\"column\":\"beer-name\",\"new_value\":\"Triangle Belgian Golden Ale\",\"reason\":\"The beer name has been changed to 'Triangle Belgian Golden Ale'.\"},{\"row\":2213,\"column\":\"beer-name\",\"new_value\":\"Troegenator\",\"reason\":\"The beer name has been changed to 'Troegenator'.\"},{\"row\":2214,\"column\":\"beer-name\",\"new_value\":\"Nugget Nectar\",\"reason\":\"The beer name has been changed to 'Nugget Nectar'.\"}]}" }, { "task_index": 39, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "1271", "index": "1272", "id": "1671", "beer-name": "Gillespie Brown Ale", "style": "American Brown Ale", "ounces": "12.0 oz", "abv": "0.095", "ibu": "49", "brewery_id": "346", "brewery-name": "Manzanita Brewing Company", "city": "Santee", "state": "CA" }, { "_row": "1272", "index": "1273", "id": "1670", "beer-name": "Manzanita Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 OZ.", "abv": "0.066", "ibu": "44", "brewery_id": "346", "brewery-name": "Manzanita Brewing Company", "city": "Santee", "state": "CA" }, { "_row": "1273", "index": "1274", "id": "1262", "beer-name": "Marble Pilsner", "style": "German Pilsener", "ounces": "12.0 oz", "abv": "0.047%", "ibu": "N/A", "brewery_id": "443", "brewery-name": "Marble Brewery", "city": "Albuquerque", "state": "NM" }, { "_row": "1274", "index": "1275", "id": "845", "beer-name": "Marble India Pale Ale", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.062", "ibu": "N/A", "brewery_id": "443", "brewery-name": "Marble Brewery", "city": "Albuquerque", "state": "NM" } ], "ground_truth": [ { "row": 1271, "column": "ounces", "clean_value": "12" }, { "row": 1272, "column": "ounces", "clean_value": "12" }, { "row": 1273, "column": "ounces", "clean_value": "12" }, { "row": 1273, "column": "abv", "clean_value": "0.047" }, { "row": 1273, "column": "ibu", "clean_value": "" }, { "row": 1274, "column": "ounces", "clean_value": "12" }, { "row": 1274, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1271, "column": "abv", "new_value": "0.095", "reason": "The new value for abv is incorrect." }, { "row": 1272, "column": "abv", "new_value": "0.066", "reason": "The new value for abv is incorrect." }, { "row": 1273, "column": "abv", "new_value": "0.047%", "reason": "The new value for abv is incorrect." }, { "row": 1274, "column": "abv", "new_value": "0.062", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1271,\"column\":\"abv\",\"new_value\":\"0.095\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1272,\"column\":\"abv\",\"new_value\":\"0.066\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1273,\"column\":\"abv\",\"new_value\":\"0.047%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1274,\"column\":\"abv\",\"new_value\":\"0.062\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 48, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "491", "index": "492", "id": "49", "beer-name": "Porkslap Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.043%", "ibu": "N/A", "brewery_id": "556", "brewery-name": "Butternuts Beer and Ale", "city": "Garrattsville", "state": "NY" }, { "_row": "492", "index": "493", "id": "2657", "beer-name": "Blackbeard", "style": "American Double / Imperial Stout", "ounces": "12.0 ounce", "abv": "0.093", "ibu": "N/A", "brewery_id": "5", "brewery-name": "COAST Brewing Company", "city": "Charleston", "state": "SC" }, { "_row": "493", "index": "494", "id": "2656", "beer-name": "Rye Knot", "style": "American Brown Ale", "ounces": "12.0 oz. Alumi-Tek", "abv": "0.062", "ibu": "N/A", "brewery_id": "5", "brewery-name": "COAST Brewing Company", "city": "Charleston", "state": "SC" }, { "_row": "494", "index": "495", "id": "2655", "beer-name": "Dead Arm", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.06", "ibu": "N/A", "brewery_id": "5", "brewery-name": "COAST Brewing Company", "city": "Charleston", "state": "SC" } ], "ground_truth": [ { "row": 491, "column": "ounces", "clean_value": "12" }, { "row": 491, "column": "abv", "clean_value": "0.043" }, { "row": 491, "column": "ibu", "clean_value": "" }, { "row": 492, "column": "ounces", "clean_value": "12" }, { "row": 492, "column": "ibu", "clean_value": "" }, { "row": 493, "column": "ounces", "clean_value": "12" }, { "row": 493, "column": "ibu", "clean_value": "" }, { "row": 494, "column": "ounces", "clean_value": "12" }, { "row": 494, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 491, "column": "abv", "new_value": "0.043%", "reason": "The new value for abv is incorrect." }, { "row": 492, "column": "abv", "new_value": "0.093", "reason": "The new value for abv is incorrect." }, { "row": 493, "column": "abv", "new_value": "0.062", "reason": "The new value for abv is incorrect." }, { "row": 494, "column": "abv", "new_value": "0.06", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":491,\"column\":\"abv\",\"new_value\":\"0.043%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":492,\"column\":\"abv\",\"new_value\":\"0.093\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":493,\"column\":\"abv\",\"new_value\":\"0.062\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":494,\"column\":\"abv\",\"new_value\":\"0.06\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 51, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.1538, "precision": 0.3333, "recall": 0.1, "tp": 1, "fp": 2, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 2 }, "target_rows": [ { "_row": "2265", "index": "2266", "id": "877", "beer-name": "Draught Hard Apple Cider", "style": "Cider", "ounces": "16.0 oz", "abv": "0.065", "ibu": "N/A", "brewery_id": "338", "brewery-name": "Uncle John's Fruit House Winery", "city": "St. John's", "state": "MI" }, { "_row": "2266", "index": "2267", "id": "606", "beer-name": "Scotty K NA", "style": "Low Alcohol Beer", "ounces": "16.0 ounce", "abv": "0.001%", "ibu": "N/A", "brewery_id": "522", "brewery-name": "Uncommon Brewers", "city": "Santa Cruz", "state": "CA" }, { "_row": "2267", "index": "2268", "id": "543", "beer-name": "Bacon Brown Ale", "style": "American Brown Ale", "ounces": "16.0 oz", "abv": "0.068%", "ibu": "N/A", "brewery_id": "522", "brewery-name": "Uncommon Brewers", "city": "Santa Cruz", "state": "CA" }, { "_row": "2268", "index": "2269", "id": "347", "beer-name": "Golden State Ale", "style": "Belgian Pale Ale", "ounces": "16.0 oz.", "abv": "0.064", "ibu": "N/A", "brewery_id": "522", "brewery-name": "Uncommon Brewers", "city": "Santa Cruz", "state": "CA" } ], "ground_truth": [ { "row": 2265, "column": "ounces", "clean_value": "16" }, { "row": 2265, "column": "ibu", "clean_value": "" }, { "row": 2266, "column": "ounces", "clean_value": "16" }, { "row": 2266, "column": "abv", "clean_value": "0.001" }, { "row": 2266, "column": "ibu", "clean_value": "" }, { "row": 2267, "column": "ounces", "clean_value": "16" }, { "row": 2267, "column": "abv", "clean_value": "0.068" }, { "row": 2267, "column": "ibu", "clean_value": "" }, { "row": 2268, "column": "ounces", "clean_value": "16" }, { "row": 2268, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 2268, "column": "ibu", "new_value": "N/A", "reason": "The beer has an incorrect IBU value (should be 0.064 but is currently 0.068). This change will affect the beer's alcohol content." }, { "row": 2267, "column": "abv", "new_value": "0.068", "reason": "The beer has an incorrect ABV value (should be 0.065 but is currently 0.001%). This change will affect the beer's alcohol content." }, { "row": 2266, "column": "ibu", "new_value": "N/A", "reason": "The beer has an incorrect IBU value (should be 0.001% but is currently 0.065). This change will affect the beer's alcohol content." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":2268,\"column\":\"ibu\",\"new_value\":\"N/A\",\"reason\":\"The beer has an incorrect IBU value (should be 0.064 but is currently 0.068). This change will affect the beer's alcohol content.\"},{\"row\":2267,\"column\":\"abv\",\"new_value\":\"0.068\",\"reason\":\"The beer has an incorrect ABV value (should be 0.065 but is currently 0.001%). This change will affect the beer's alcohol content.\"},{\"row\":2266,\"column\":\"ibu\",\"new_value\":\"N/A\",\"reason\":\"The beer has an incorrect IBU value (should be 0.001% but is currently 0.065). This change will affect the beer's alcohol content.\"}]}" }, { "task_index": 54, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "123", "index": "124", "id": "1293", "beer-name": "Angry Orchard Crisp Apple", "style": "Cider", "ounces": "16.0 oz.", "abv": "0.05%", "ibu": "N/A", "brewery_id": "434", "brewery-name": "Angry Orchard Cider Company", "city": "Cincinnati", "state": "OH" }, { "_row": "124", "index": "125", "id": "1292", "beer-name": "Angry Orchard Crisp Apple", "style": "Cider", "ounces": "12.0 OZ.", "abv": "0.05", "ibu": "N/A", "brewery_id": "434", "brewery-name": "Angry Orchard Cider Company", "city": "Cincinnati", "state": "OH" }, { "_row": "125", "index": "126", "id": "2207", "beer-name": "Golden One", "style": "Belgian Pale Ale", "ounces": "12.0 oz.", "abv": "0.068", "ibu": "N/A", "brewery_id": "193", "brewery-name": "Anthem Brewing Company", "city": "Oklahoma City", "state": "OK" }, { "_row": "126", "index": "127", "id": "2040", "beer-name": "Arjuna", "style": "Witbier", "ounces": "12.0 ounce", "abv": "0.06", "ibu": "N/A", "brewery_id": "193", "brewery-name": "Anthem Brewing Company", "city": "Oklahoma City", "state": "OK" } ], "ground_truth": [ { "row": 123, "column": "ounces", "clean_value": "16" }, { "row": 123, "column": "abv", "clean_value": "0.05" }, { "row": 123, "column": "ibu", "clean_value": "" }, { "row": 124, "column": "ounces", "clean_value": "12" }, { "row": 124, "column": "ibu", "clean_value": "" }, { "row": 125, "column": "ounces", "clean_value": "12" }, { "row": 125, "column": "ibu", "clean_value": "" }, { "row": 126, "column": "ounces", "clean_value": "12" }, { "row": 126, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 123, "column": "abv", "new_value": "0.05%", "reason": "The beer name is incorrect." }, { "row": 124, "column": "abv", "new_value": "0.05", "reason": "The beer name is incorrect." }, { "row": 125, "column": "abv", "new_value": "0.068", "reason": "The beer name is incorrect." }, { "row": 126, "column": "abv", "new_value": "0.06", "reason": "The beer name is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":123,\"column\":\"abv\",\"new_value\":\"0.05%\",\"reason\":\"The beer name is incorrect.\"},{\"row\":124,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The beer name is incorrect.\"},{\"row\":125,\"column\":\"abv\",\"new_value\":\"0.068\",\"reason\":\"The beer name is incorrect.\"},{\"row\":126,\"column\":\"abv\",\"new_value\":\"0.06\",\"reason\":\"The beer name is incorrect.\"}]}" }, { "task_index": 57, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 }, "target_rows": [ { "_row": "782", "index": "783", "id": "1731", "beer-name": "Peaches & Cream", "style": "Fruit / Vegetable Beer", "ounces": "16.0 oz.", "abv": "0.046", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "783", "index": "784", "id": "1022", "beer-name": "Quaff India Style Session Ale", "style": "American IPA", "ounces": "16.0 OZ.", "abv": "0.051", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "784", "index": "785", "id": "895", "beer-name": "Loki Red Ale (2013)", "style": "American Amber / Red Ale", "ounces": "16.0 OZ.", "abv": "0.075", "ibu": "53", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "785", "index": "786", "id": "682", "beer-name": "Mjolnir Imperial IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.069", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" } ], "ground_truth": [ { "row": 782, "column": "ounces", "clean_value": "16" }, { "row": 782, "column": "ibu", "clean_value": "" }, { "row": 783, "column": "ounces", "clean_value": "16" }, { "row": 783, "column": "ibu", "clean_value": "" }, { "row": 784, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 782, "column": "abv", "new_value": "0.046", "reason": "The beer name is incorrect." }, { "row": 783, "column": "abv", "new_value": "0.051", "reason": "The beer name is incorrect." }, { "row": 784, "column": "abv", "new_value": "0.075", "reason": "The beer name is incorrect." }, { "row": 785, "column": "abv", "new_value": "0.069", "reason": "The beer name is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":782,\"column\":\"abv\",\"new_value\":\"0.046\",\"reason\":\"The beer name is incorrect.\"},{\"row\":783,\"column\":\"abv\",\"new_value\":\"0.051\",\"reason\":\"The beer name is incorrect.\"},{\"row\":784,\"column\":\"abv\",\"new_value\":\"0.075\",\"reason\":\"The beer name is incorrect.\"},{\"row\":785,\"column\":\"abv\",\"new_value\":\"0.069\",\"reason\":\"The beer name is incorrect.\"}]}" }, { "task_index": 72, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 5, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "1325", "index": "1326", "id": "1508", "beer-name": "Shark Bait", "style": "Fruit / Vegetable Beer", "ounces": "12.0 oz", "abv": "0.053%", "ibu": "11", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" }, { "_row": "1326", "index": "1327", "id": "1507", "beer-name": "Gator Tail Brown Ale", "style": "American Brown Ale", "ounces": "12.0 ounce", "abv": "0.053", "ibu": "30", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" }, { "_row": "1327", "index": "1328", "id": "1506", "beer-name": "Miami Vice IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.071", "ibu": "62", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" }, { "_row": "1328", "index": "1329", "id": "1325", "beer-name": "Big Rod Coconut Ale", "style": "American Blonde Ale", "ounces": "12.0 oz", "abv": "0.053", "ibu": "16", "brewery_id": "393", "brewery-name": "Miami Brewing Company", "city": "Miami", "state": "FL" } ], "ground_truth": [ { "row": 1325, "column": "ounces", "clean_value": "12" }, { "row": 1325, "column": "abv", "clean_value": "0.053" }, { "row": 1326, "column": "ounces", "clean_value": "12" }, { "row": 1327, "column": "ounces", "clean_value": "12" }, { "row": 1328, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1325, "column": "abv", "new_value": "0.053%", "reason": "The new value for abv is incorrect." }, { "row": 1326, "column": "abv", "new_value": "0.053", "reason": "The new value for abv is incorrect." }, { "row": 1327, "column": "abv", "new_value": "0.071", "reason": "The new value for abv is incorrect." }, { "row": 1328, "column": "abv", "new_value": "0.053", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1325,\"column\":\"abv\",\"new_value\":\"0.053%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1326,\"column\":\"abv\",\"new_value\":\"0.053\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1327,\"column\":\"abv\",\"new_value\":\"0.071\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1328,\"column\":\"abv\",\"new_value\":\"0.053\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 78, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 4 }, "target_rows": [ { "_row": "783", "index": "784", "id": "1022", "beer-name": "Quaff India Style Session Ale", "style": "American IPA", "ounces": "16.0 OZ.", "abv": "0.051", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "784", "index": "785", "id": "895", "beer-name": "Loki Red Ale (2013)", "style": "American Amber / Red Ale", "ounces": "16.0 OZ.", "abv": "0.075", "ibu": "53", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "785", "index": "786", "id": "682", "beer-name": "Mjolnir Imperial IPA", "style": "American Double / Imperial IPA", "ounces": "16.0 oz", "abv": "0.069", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" }, { "_row": "786", "index": "787", "id": "112", "beer-name": "Fearless Scottish Ale", "style": "Scottish Ale", "ounces": "16.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "201", "brewery-name": "Fearless Brewing Company", "city": "Estacada", "state": "OR" } ], "ground_truth": [ { "row": 783, "column": "ounces", "clean_value": "16" }, { "row": 783, "column": "ibu", "clean_value": "" }, { "row": 784, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ounces", "clean_value": "16" }, { "row": 785, "column": "ibu", "clean_value": "" }, { "row": 786, "column": "ounces", "clean_value": "16" }, { "row": 786, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 783, "column": "abv", "new_value": "0.051", "reason": "The beer name is incorrect." }, { "row": 784, "column": "abv", "new_value": "0.075", "reason": "The beer name is incorrect." }, { "row": 785, "column": "abv", "new_value": "0.069", "reason": "The beer name is incorrect." }, { "row": 786, "column": "abv", "new_value": "0.05", "reason": "The beer name is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":783,\"column\":\"abv\",\"new_value\":\"0.051\",\"reason\":\"The beer name is incorrect.\"},{\"row\":784,\"column\":\"abv\",\"new_value\":\"0.075\",\"reason\":\"The beer name is incorrect.\"},{\"row\":785,\"column\":\"abv\",\"new_value\":\"0.069\",\"reason\":\"The beer name is incorrect.\"},{\"row\":786,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The beer name is incorrect.\"}]}" }, { "task_index": 81, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 }, "target_rows": [ { "_row": "299", "index": "300", "id": "1025", "beer-name": "N Street Drive-In 50th Anniversary IPA", "style": "American Double / Imperial IPA", "ounces": "12.0 ounce", "abv": "", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" }, { "_row": "300", "index": "301", "id": "1012", "beer-name": "467 Ethan's Stout", "style": "American Stout", "ounces": "12.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" }, { "_row": "301", "index": "302", "id": "942", "beer-name": "1335 Wicked Snout", "style": "Saison / Farmhouse Ale", "ounces": "12.0 ounce", "abv": "0.064", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" }, { "_row": "302", "index": "303", "id": "937", "beer-name": "543 Skull Creek Fresh Hopped Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.045", "ibu": "N/A", "brewery_id": "380", "brewery-name": "Blue Blood Brewing Company", "city": "Lincoln", "state": "NE" } ], "ground_truth": [ { "row": 299, "column": "ounces", "clean_value": "12" }, { "row": 299, "column": "ibu", "clean_value": "" }, { "row": 300, "column": "ounces", "clean_value": "12" }, { "row": 300, "column": "ibu", "clean_value": "" }, { "row": 301, "column": "ounces", "clean_value": "12" }, { "row": 301, "column": "ibu", "clean_value": "" }, { "row": 302, "column": "ounces", "clean_value": "12" }, { "row": 302, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 299, "column": "abv", "new_value": "0.05", "reason": "The beer name is incorrect." }, { "row": 300, "column": "abv", "new_value": "0.064", "reason": "The beer name is incorrect." }, { "row": 301, "column": "abv", "new_value": "0.045", "reason": "The beer name is incorrect." }, { "row": 302, "column": "abv", "new_value": "0.05", "reason": "The beer name is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":299,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The beer name is incorrect.\"},{\"row\":300,\"column\":\"abv\",\"new_value\":\"0.064\",\"reason\":\"The beer name is incorrect.\"},{\"row\":301,\"column\":\"abv\",\"new_value\":\"0.045\",\"reason\":\"The beer name is incorrect.\"},{\"row\":302,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The beer name is incorrect.\"}]}" }, { "task_index": 84, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6 }, "target_rows": [ { "_row": "2014", "index": "2015", "id": "139", "beer-name": "Point Amber Classic", "style": "American Amber / Red Lager", "ounces": "12.0 oz.", "abv": "0.047", "ibu": "14", "brewery_id": "131", "brewery-name": "Stevens Point Brewery", "city": "Stevens Point", "state": "WI" }, { "_row": "2015", "index": "2016", "id": "138", "beer-name": "Point Special Lager", "style": "American Adjunct Lager", "ounces": "12.0 oz", "abv": "0.047", "ibu": "9", "brewery_id": "131", "brewery-name": "Stevens Point Brewery", "city": "Stevens Point", "state": "WI" }, { "_row": "2016", "index": "2017", "id": "953", "beer-name": "Wisco Disco", "style": "American Amber / Red Ale", "ounces": "16.0 ounce", "abv": "0.051%", "ibu": "31", "brewery_id": "486", "brewery-name": "Stillmank Beer Company", "city": "Green Bay", "state": "WI" }, { "_row": "2017", "index": "2018", "id": "1983", "beer-name": "Brontide", "style": "American Black Ale", "ounces": "12.0 OZ.", "abv": "0.05", "ibu": "N/A", "brewery_id": "255", "brewery-name": "Stillwater Artisanal Ales", "city": "Baltimore", "state": "MD" } ], "ground_truth": [ { "row": 2014, "column": "ounces", "clean_value": "12" }, { "row": 2015, "column": "ounces", "clean_value": "12" }, { "row": 2016, "column": "ounces", "clean_value": "16" }, { "row": 2016, "column": "abv", "clean_value": "0.051" }, { "row": 2017, "column": "ounces", "clean_value": "12" }, { "row": 2017, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":2014,\"column\":\"abv\",\"new_value\":\"0.047\",\"reason\":\"The beer name is incorrect.\"},{\"row\":2015,\"column\":\"abv\",\"new_value\":\"0.047\",\"reason\":\"The beer name is incorrect.\"},{\"row\":2016,\"column\":\"abv\",\"new_value\":\"0.051%\",(\"The beer abv value is too low.\"),\"reason\":\"The beer abv value is too low.\"},{\"row\":2017,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The beer abv value is too low.\"}]}" }, { "task_index": 87, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "203", "index": "204", "id": "1855", "beer-name": "Tarnation California-Style Lager", "style": "California Common / Steam Beer", "ounces": "12.0 oz", "abv": "0.053", "ibu": "N/A", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" }, { "_row": "204", "index": "205", "id": "1778", "beer-name": "On the Count of 3 (2015)", "style": "Hefeweizen", "ounces": "16.0 oz", "abv": "0.07%", "ibu": "42", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" }, { "_row": "205", "index": "206", "id": "1209", "beer-name": "Summer Swelter", "style": "American Pale Wheat Ale", "ounces": "12.0 oz", "abv": "0.047", "ibu": "N/A", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" }, { "_row": "206", "index": "207", "id": "954", "beer-name": "Phantom Punch Winter Stout", "style": "Foreign / Export Stout", "ounces": "12.0 oz.", "abv": "0.068", "ibu": "N/A", "brewery_id": "292", "brewery-name": "Baxter Brewing Company", "city": "Lewiston", "state": "ME" } ], "ground_truth": [ { "row": 203, "column": "ounces", "clean_value": "12" }, { "row": 203, "column": "ibu", "clean_value": "" }, { "row": 204, "column": "ounces", "clean_value": "16" }, { "row": 204, "column": "abv", "clean_value": "0.07" }, { "row": 205, "column": "ounces", "clean_value": "12" }, { "row": 205, "column": "ibu", "clean_value": "" }, { "row": 206, "column": "ounces", "clean_value": "12" }, { "row": 206, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 203, "column": "abv", "new_value": "0.053", "reason": "The new value for abv is incorrect." }, { "row": 204, "column": "abv", "new_value": "0.07%", "reason": "The new value for abv is incorrect." }, { "row": 205, "column": "abv", "new_value": "0.047", "reason": "The new value for abv is incorrect." }, { "row": 206, "column": "abv", "new_value": "0.068", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":203,\"column\":\"abv\",\"new_value\":\"0.053\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":204,\"column\":\"abv\",\"new_value\":\"0.07%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":205,\"column\":\"abv\",\"new_value\":\"0.047\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":206,\"column\":\"abv\",\"new_value\":\"0.068\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 93, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 4 }, "target_rows": [ { "_row": "1413", "index": "1414", "id": "132", "beer-name": "Full Moon Belgian White Ale (2007)", "style": "Witbier", "ounces": "12.0 oz.", "abv": "0.085", "ibu": "N/A", "brewery_id": "507", "brewery-name": "Mudshark Brewing Company", "city": "Lake Havasu City", "state": "AZ" }, { "_row": "1414", "index": "1415", "id": "131", "beer-name": "Dry Heat Hefeweizen (2006)", "style": "Hefeweizen", "ounces": "12.0 OZ.", "abv": "0.055", "ibu": "N/A", "brewery_id": "507", "brewery-name": "Mudshark Brewing Company", "city": "Lake Havasu City", "state": "AZ" }, { "_row": "1415", "index": "1416", "id": "1598", "beer-name": "Mustang Sixty-Six", "style": "American Amber / Red Lager", "ounces": "12.0 ounce", "abv": "0.05", "ibu": "N/A", "brewery_id": "366", "brewery-name": "Mustang Brewing Company", "city": "Mustang", "state": "OK" }, { "_row": "1416", "index": "1417", "id": "862", "beer-name": "Mustang '33", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "0.04", "ibu": "N/A", "brewery_id": "366", "brewery-name": "Mustang Brewing Company", "city": "Mustang", "state": "OK" } ], "ground_truth": [ { "row": 1413, "column": "ounces", "clean_value": "12" }, { "row": 1413, "column": "ibu", "clean_value": "" }, { "row": 1414, "column": "ounces", "clean_value": "12" }, { "row": 1414, "column": "ibu", "clean_value": "" }, { "row": 1415, "column": "ounces", "clean_value": "12" }, { "row": 1415, "column": "ibu", "clean_value": "" }, { "row": 1416, "column": "ounces", "clean_value": "12" }, { "row": 1416, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 1413, "column": "abv", "new_value": "0.085", "reason": "The new value for abv is incorrect." }, { "row": 1414, "column": "abv", "new_value": "0.055", "reason": "The new value for abv is incorrect." }, { "row": 1415, "column": "abv", "new_value": "0.05", "reason": "The new value for abv is incorrect." }, { "row": 1416, "column": "abv", "new_value": "0.04", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1413,\"column\":\"abv\",\"new_value\":\"0.085\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1414,\"column\":\"abv\",\"new_value\":\"0.055\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1415,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":1416,\"column\":\"abv\",\"new_value\":\"0.04\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 99, "dataset": "beers", "inferability": "deterministic_normalization", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 6, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 5, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "979", "index": "980", "id": "1106", "beer-name": "Pablo Beach Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.05%", "ibu": "30", "brewery_id": "466", "brewery-name": "Green Room Brewing", "city": "Jacksonville", "state": "FL" }, { "_row": "980", "index": "981", "id": "2314", "beer-name": "Wild Trail Pale Ale", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.057", "ibu": "44", "brewery_id": "156", "brewery-name": "Greenbrier Valley Brewing Company", "city": "Lewisburg", "state": "WV" }, { "_row": "981", "index": "982", "id": "2313", "beer-name": "Mothman Black IPA", "style": "American Black Ale", "ounces": "12.0 ounce", "abv": "0.067", "ibu": "71", "brewery_id": "156", "brewery-name": "Greenbrier Valley Brewing Company", "city": "Lewisburg", "state": "WV" }, { "_row": "982", "index": "983", "id": "2461", "beer-name": "Autumn Winds Fest Beer", "style": "M\u00e4rzen / Oktoberfest", "ounces": "16.0 ounce", "abv": "0.058", "ibu": "N/A", "brewery_id": "86", "brewery-name": "Grey Sail Brewing Company", "city": "Westerly", "state": "RI" } ], "ground_truth": [ { "row": 979, "column": "ounces", "clean_value": "12" }, { "row": 979, "column": "abv", "clean_value": "0.05" }, { "row": 980, "column": "ounces", "clean_value": "12" }, { "row": 981, "column": "ounces", "clean_value": "12" }, { "row": 982, "column": "ounces", "clean_value": "16" }, { "row": 982, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 979, "column": "abv", "new_value": "0.05%", "reason": "The beer name is incorrect." }, { "row": 980, "column": "abv", "new_value": "0.057", "reason": "The beer name is incorrect." }, { "row": 981, "column": "abv", "new_value": "0.067", "reason": "The beer name is incorrect." }, { "row": 982, "column": "abv", "new_value": "0.058", "reason": "The beer name is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":979,\"column\":\"abv\",\"new_value\":\"0.05%\",\"reason\":\"The beer name is incorrect.\"},{\"row\":980,\"column\":\"abv\",\"new_value\":\"0.057\",\"reason\":\"The beer name is incorrect.\"},{\"row\":981,\"column\":\"abv\",\"new_value\":\"0.067\",\"reason\":\"The beer name is incorrect.\"},{\"row\":982,\"column\":\"abv\",\"new_value\":\"0.058\",\"reason\":\"The beer name is incorrect.\"}]}" } ], "not_inferable_from_prompt": [ { "task_index": 5, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1727", "tuple_id": "1728", "src": "ua", "flight": "UA-397-JFK-SFO", "sched_dep_time": "8:00 a.m.", "act_dep_time": "8:29 a.m.", "sched_arr_time": "11:55 a.m.", "act_arr_time": "11:58 a.m." }, { "_row": "1728", "tuple_id": "1729", "src": "ua", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1729", "tuple_id": "1730", "src": "ua", "flight": "UA-2830-MCO-CLT", "sched_dep_time": "3:27 p.m.", "act_dep_time": "3:27 p.m.", "sched_arr_time": "5:05 p.m.", "act_arr_time": "5:17 p.m." }, { "_row": "1730", "tuple_id": "1731", "src": "ua", "flight": "UA-5487-SFO-MRY", "sched_dep_time": "10:39 a.m.", "act_dep_time": "10:33 a.m.", "sched_arr_time": "11:19 a.m.", "act_arr_time": "11:21 a.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1727, "column": "act_arr_time", "new_value": "11:58 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1728, "column": "act_arr_time", "new_value": "9:43 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1729, "column": "act_arr_time", "new_value": "5:17 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1730, "column": "act_arr_time", "new_value": "11:21 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1727,\"column\":\"act_arr_time\",\"new_value\":\"11:58 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1728,\"column\":\"act_arr_time\",\"new_value\":\"9:43 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1729,\"column\":\"act_arr_time\",\"new_value\":\"5:17 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1730,\"column\":\"act_arr_time\",\"new_value\":\"11:21 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 10, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "122", "index": "123", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-4", "MeasureName": "heart attack patients given smoking cessation advice/counseling", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-4" }, { "_row": "123", "index": "124", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "0%", "Sample": "1 patients", "Stateavg": "al_ami-5" }, { "_row": "124", "index": "125", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "125", "index": "126", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" } ], "ground_truth": [], "predicted_repairs": [ { "row": 122, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." }, { "row": 123, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." }, { "row": 124, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." }, { "row": 125, "column": "Address1", "new_value": "101 hospital circle", "reason": "The address does not exist." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":122,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"},{\"row\":123,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"},{\"row\":124,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"},{\"row\":125,\"column\":\"Address1\",\"new_value\":\"101 hospital circle\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '101 hospital circle' does not exist.\"}]}" }, { "task_index": 20, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "13", "tuple_id": "14", "src": "aa", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "8:00 a.m.", "act_arr_time": "8:06 a.m." }, { "_row": "14", "tuple_id": "15", "src": "aa", "flight": "AA-1279-DFW-PHX", "sched_dep_time": "1:00 p.m.", "act_dep_time": "2:04 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:30 p.m." }, { "_row": "15", "tuple_id": "16", "src": "aa", "flight": "AA-616-DFW-DTW", "sched_dep_time": "9:05 a.m.", "act_dep_time": "10:10 a.m.", "sched_arr_time": "12:35 p.m.", "act_arr_time": "1:27 p.m." }, { "_row": "16", "tuple_id": "17", "src": "aa", "flight": "AA-4344-ORD-DTW", "sched_dep_time": "11:45 a.m.", "act_dep_time": "12:13 p.m.", "sched_arr_time": "2:00 p.m.", "act_arr_time": "2:10 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 13, "column": "act_arr_time", "new_value": "8:06 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 14, "column": "act_arr_time", "new_value": "3:30 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 15, "column": "act_arr_time", "new_value": "1:27 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 16, "column": "act_arr_time", "new_value": "2:10 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":13,\"column\":\"act_arr_time\",\"new_value\":\"8:06 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":14,\"column\":\"act_arr_time\",\"new_value\":\"3:30 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":15,\"column\":\"act_arr_time\",\"new_value\":\"1:27 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":16,\"column\":\"act_arr_time\",\"new_value\":\"2:10 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 25, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "661", "index": "662", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-3" }, { "_row": "662", "index": "663", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-4" }, { "_row": "663", "index": "664", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-inf-6" }, { "_row": "664", "index": "665", "ProviderNumber": "10032", "HospitalName": "wedowee hospital", "Address1": "209 north main street", "Address2": "empty", "Address3": "empty", "City": "wedowee", "State": "al", "ZipCode": "36278", "CountyName": "randolph", "PhoneNumber": "2563572111", "HospitalType": "acute care hospitals", "HospitalOwner": "government - local", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "empty", "Sample": "empty", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [], "predicted_repairs": [ { "row": 661, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." }, { "row": 662, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." }, { "row": 663, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." }, { "row": 664, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid zip code." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":661,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"},{\"row\":662,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"},{\"row\":663,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"},{\"row\":664,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid zip code.\",\"repair_reason\":\"Invalid zip code\"}]}" }, { "task_index": 35, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1452", "tuple_id": "1453", "src": "ifly", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1453", "tuple_id": "1454", "src": "ifly", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:19 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:13 p.m." }, { "_row": "1454", "tuple_id": "1455", "src": "ifly", "flight": "AA-1434-DFW-MCO", "sched_dep_time": "7:15 a.m.", "act_dep_time": "7:21 a.m.", "sched_arr_time": "10:35 a.m.", "act_arr_time": "10:36 a.m." }, { "_row": "1455", "tuple_id": "1456", "src": "ifly", "flight": "UA-664-ORD-PHL", "sched_dep_time": "1:33 p.m.", "act_dep_time": "1:31 p.m.", "sched_arr_time": "4:31 p.m.", "act_arr_time": "4:23 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1452, "column": "act_arr_time", "new_value": "9:43 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1453, "column": "act_arr_time", "new_value": "3:13 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1454, "column": "act_arr_time", "new_value": "10:36 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1455, "column": "act_arr_time", "new_value": "4:23 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1452,\"column\":\"act_arr_time\",\"new_value\":\"9:43 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1453,\"column\":\"act_arr_time\",\"new_value\":\"3:13 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1454,\"column\":\"act_arr_time\",\"new_value\":\"10:36 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1455,\"column\":\"act_arr_time\",\"new_value\":\"4:23 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 40, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "299", "index": "300", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "empty", "Stateavg": "al_ami-7a" }, { "_row": "300", "index": "301", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "empty", "Stateavg": "al_ami-8a" }, { "_row": "301", "index": "302", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "empty", "Sample": "empty", "Stateavg": "al_hf-1" }, { "_row": "302", "index": "303", "ProviderNumber": "10018", "HospitalName": "callahan eye foundation hospital", "Address1": "1720 university blvd", "Address2": "empty", "Address3": "empty", "City": "birmingham", "State": "al", "ZipCode": "35233", "CountyName": "jefferson", "PhoneNumber": "2053258100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "empty", "Sample": "empty", "Stateavg": "al_hf-2" } ], "ground_truth": [], "predicted_repairs": [ { "row": 299, "column": "Address1", "new_value": "1720 university blvd", "reason": "The address is incorrect." }, { "row": 300, "column": "Address1", "new_value": "1720 university blvd", "reason": "The address is incorrect." }, { "row": 301, "column": "Address1", "new_value": "1720 university blvd", "reason": "The address is incorrect." }, { "row": 302, "column": "Address1", "new_value": "1720 university blvd", "reason": "The address is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":299,\"column\":\"Address1\",\"new_value\":\"1720 university blvd\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not exist or is not a valid location.\"},{\"row\":300,\"column\":\"Address1\",\"new_value\":\"1720 university blvd\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not exist or is not a valid location.\"},{\"row\":301,\"column\":\"Address1\",\"new_value\":\"1720 university blvd\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not exist or is not a valid location.\"},{\"row\":302,\"column\":\"Address1\",\"new_value\":\"1720 university blvd\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not exist or is not a valid location.\"}]}" }, { "task_index": 50, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1450", "tuple_id": "1451", "src": "ifly", "flight": "CO-89-IAH-EWR", "sched_dep_time": "6:00 a.m.", "act_dep_time": "6:02 a.m.", "sched_arr_time": "10:20 a.m.", "act_arr_time": "10:27 a.m." }, { "_row": "1451", "tuple_id": "1452", "src": "ifly", "flight": "UA-938-DEN-ORD", "sched_dep_time": "4:16 p.m.", "act_dep_time": "4:15 p.m.", "sched_arr_time": "7:35 p.m.", "act_arr_time": "7:36 p.m." }, { "_row": "1452", "tuple_id": "1453", "src": "ifly", "flight": "UA-3925-IAD-ORF", "sched_dep_time": "8:41 a.m.", "act_dep_time": "8:42 a.m.", "sched_arr_time": "9:54 a.m.", "act_arr_time": "9:43 a.m." }, { "_row": "1453", "tuple_id": "1454", "src": "ifly", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:19 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "3:13 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1450, "column": "act_arr_time", "new_value": "10:27 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1451, "column": "act_arr_time", "new_value": "7:36 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1452, "column": "act_arr_time", "new_value": "9:43 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1453, "column": "act_arr_time", "new_value": "3:13 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1450,\"column\":\"act_arr_time\",\"new_value\":\"10:27 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1451,\"column\":\"act_arr_time\",\"new_value\":\"7:36 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1452,\"column\":\"act_arr_time\",\"new_value\":\"9:43 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1453,\"column\":\"act_arr_time\",\"new_value\":\"3:13 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 55, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "910", "index": "911", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "88%", "Sample": "8 patients", "Stateavg": "al_ami-7a" }, { "_row": "911", "index": "912", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "100%", "Sample": "16 patients", "Stateavg": "al_ami-8a" }, { "_row": "912", "index": "913", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "100%", "Sample": "268 patients", "Stateavg": "al_hf-1" }, { "_row": "913", "index": "914", "ProviderNumber": "10046", "HospitalName": "riverview regional medical center", "Address1": "600 south third street", "Address2": "empty", "Address3": "empty", "City": "gadsden", "State": "al", "ZipCode": "35901", "CountyName": "etowah", "PhoneNumber": "2565435200", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "100%", "Sample": "350 patients", "Stateavg": "al_hf-2" } ], "ground_truth": [], "predicted_repairs": [ { "row": 910, "column": "Address1", "new_value": "600 south third street", "reason": "The address does not match any known hospital location." }, { "row": 911, "column": "Address1", "new_value": "600 south third street", "reason": "The address does not match any known hospital location." }, { "row": 912, "column": "Address1", "new_value": "600 south third street", "reason": "The address does not match any known hospital location." }, { "row": 913, "column": "Address1", "new_value": "600 south third street", "reason": "The address does not match any known hospital location." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":910,\"column\":\"Address1\",\"new_value\":\"600 south third street\",\"reason\":\"The address does not match any known hospital location.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital location.\"},{\"row\":911,\"column\":\"Address1\",\"new_value\":\"600 south third street\",\"reason\":\"The address does not match any known hospital location.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital location.\"},{\"row\":912,\"column\":\"Address1\",\"new_value\":\"600 south third street\",\"reason\":\"The address does not match any known hospital location.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital location.\"},{\"row\":913,\"column\":\"Address1\",\"new_value\":\"600 south third street\",\"reason\":\"The address does not match any known hospital location.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital location.\"}]}" }, { "task_index": 65, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "559", "tuple_id": "560", "src": "flightstats", "flight": "AA-446-DFW-PHL", "sched_dep_time": "11:50 a.m.", "act_dep_time": "12:12 p.m.", "sched_arr_time": "3:50 p.m.", "act_arr_time": "4:09 p.m." }, { "_row": "560", "tuple_id": "561", "src": "flightstats", "flight": "CO-1023-IAH-DEN", "sched_dep_time": "11:40 a.m.", "act_dep_time": "11:56 a.m.", "sched_arr_time": "1:17 p.m.", "act_arr_time": "1:14 p.m." }, { "_row": "561", "tuple_id": "562", "src": "flightstats", "flight": "AA-466-IAH-MIA", "sched_dep_time": "6:00 a.m.", "act_dep_time": "6:08 a.m.", "sched_arr_time": "9:20 a.m.", "act_arr_time": "9:05 a.m." }, { "_row": "562", "tuple_id": "563", "src": "flightstats", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:30 a.m.", "sched_arr_time": "4:57 p.m.", "act_arr_time": "5:05 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 559, "column": "act_arr_time", "new_value": "4:09 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 560, "column": "act_arr_time", "new_value": "1:14 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 561, "column": "act_arr_time", "new_value": "9:05 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 562, "column": "act_arr_time", "new_value": "5:05 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":559,\"column\":\"act_arr_time\",\"new_value\":\"4:09 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":560,\"column\":\"act_arr_time\",\"new_value\":\"1:14 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":561,\"column\":\"act_arr_time\",\"new_value\":\"9:05 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":562,\"column\":\"act_arr_time\",\"new_value\":\"5:05 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 70, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "schema_case_error": 4 }, "target_rows": [ { "_row": "458", "index": "459", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-card-2", "MeasureName": "surgery patients who were taking heart drugs called beta blockers before coming to the hospital who were kept on the beta blockers during the period just before and after their surgery", "Score": "81%", "Sample": "54 patients", "Stateavg": "al_scip-card-2" }, { "_row": "459", "index": "460", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "92%", "Sample": "253 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "460", "index": "461", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "91%", "Sample": "255 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "461", "index": "462", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "84%", "Sample": "245 patients", "Stateavg": "al_scip-inf-3" } ], "ground_truth": [], "predicted_repairs": [ { "row": 458, "column": "Index", "new_value": "459", "reason": "The patient's address has been updated to include a new street name." }, { "row": 459, "column": "Index", "new_value": "460", "reason": "The patient's address has been updated to include a new street name." }, { "row": 460, "column": "Index", "new_value": "461", "reason": "The patient's address has been updated to include a new street name." }, { "row": 461, "column": "Index", "new_value": "462", "reason": "The patient's address has been updated to include a new street name." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":458,\"column\":\"Index\",\"new_value\":\"459\",\"reason\":\"The patient's address has been updated to include a new street name.\",\"action\":\"update\"},{\"row\":459,\"column\":\"Index\",\"new_value\":\"460\",\"reason\":\"The patient's address has been updated to include a new street name.\",\"action\":\"update\"},{\"row\":460,\"column\":\"Index\",\"new_value\":\"461\",\"reason\":\"The patient's address has been updated to include a new street name.\",\"action\":\"update\"},{\"row\":461,\"column\":\"Index\",\"new_value\":\"462\",\"reason\":\"The patient's address has been updated to include a new street name.\",\"action\":\"update\"}]}" }, { "task_index": 80, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 1 }, "target_rows": [ { "_row": "589", "tuple_id": "590", "src": "flightstats", "flight": "UA-2906-PHL-MCO", "sched_dep_time": "3:50 p.m.", "act_dep_time": "4:28 p.m.", "sched_arr_time": "6:23 p.m.", "act_arr_time": "6:38 p.m." }, { "_row": "590", "tuple_id": "591", "src": "flightstats", "flight": "UA-938-DEN-ORD", "sched_dep_time": "4:16 p.m.", "act_dep_time": "4:15 p.m.", "sched_arr_time": "7:35 p.m.", "act_arr_time": "7:36 p.m." }, { "_row": "591", "tuple_id": "592", "src": "flightstats", "flight": "AA-1221-MCO-ORD", "sched_dep_time": "8:00 p.m.", "act_dep_time": "8:23 p.m.", "sched_arr_time": "9:45 p.m.", "act_arr_time": "9:53 p.m." }, { "_row": "592", "tuple_id": "593", "src": "flightstats", "flight": "CO-16-LAX-EWR", "sched_dep_time": "10:25 a.m.", "act_dep_time": "10:20 a.m.", "sched_arr_time": "6:44 p.m.", "act_arr_time": "6:34 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 592, "column": "flight", "new_value": "CO-16-LAX-EWR", "reason": "The flight CO-16-LAX-EWR is scheduled to depart at 6:44 PM instead of the expected 6:34 PM." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":592,\"column\":\"flight\",\"new_value\":\"CO-16-LAX-EWR\",\"reason\":\"The flight CO-16-LAX-EWR is scheduled to depart at 6:44 PM instead of the expected 6:34 PM.\"}]}" }, { "task_index": 85, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 4, "failure_taxonomy": { "schema_case_error": 4 }, "target_rows": [ { "_row": "141", "index": "142", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "100%", "Sample": "4 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "142", "index": "143", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "100%", "Sample": "4 patients", "Stateavg": "al_scip-vte-1" }, { "_row": "143", "index": "144", "ProviderNumber": "10008", "HospitalName": "crenshaw community hospital", "Address1": "101 hospital circle", "Address2": "empty", "Address3": "empty", "City": "luverne", "State": "al", "ZipCode": "36049", "CountyName": "crenshaw", "PhoneNumber": "3343353374", "HospitalType": "acute care hospitals", "HospitalOwner": "government - federal", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-2", "MeasureName": "patients who got treatment at the right time (within 24 hours before or after their surgery) to help prevent blood clots after certain types of surgery", "Score": "100%", "Sample": "4 patients", "Stateavg": "al_scip-vte-2" }, { "_row": "144", "index": "145", "ProviderNumber": "10009", "HospitalName": "hartselle medical center", "Address1": "201 pine street northwest", "Address2": "empty", "Address3": "empty", "City": "hartselle", "State": "al", "ZipCode": "35640", "CountyName": "morgan", "PhoneNumber": "2567736511", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-1", "MeasureName": "heart attack patients given aspirin at arrival", "Score": "100%", "Sample": "6 patients", "Stateavg": "al_ami-1" } ], "ground_truth": [], "predicted_repairs": [ { "row": 141, "column": "Index", "new_value": "10008", "reason": "The patient's condition is surgical infection prevention." }, { "row": 142, "column": "Index", "new_value": "10008", "reason": "The patient's condition is heart attack." }, { "row": 143, "column": "Index", "new_value": "10009", "reason": "The patient's condition is heart attack." }, { "row": 144, "column": "Index", "new_value": "10008", "reason": "The patient's condition is surgical infection prevention." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":141,\"column\":\"Index\",\"new_value\":\"10008\",\"reason\":\"The patient's condition is surgical infection prevention.\",\"why\":\"This patient needs surgery and has a higher risk for blood clots post-surgery.\"},{\"row\":142,\"column\":\"Index\",\"new_value\":\"10008\",\"reason\":\"The patient's condition is heart attack.\",\"why\":\"This patient requires immediate medical attention due to a heart attack.\"},{\"row\":143,\"column\":\"Index\",\"new_value\":\"10009\",\"reason\":\"The patient's condition is heart attack.\",\"why\":\"This patient needs urgent medical attention due to a heart attack.\"},{\"row\":144,\"column\":\"Index\",\"new_value\":\"10008\",\"reason\":\"The patient's condition is surgical infection prevention.\",\"why\":\"This patient needs surgery and has a higher risk for blood clots post-surgery.\"}]}" }, { "task_index": 95, "dataset": "flights", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "1431", "tuple_id": "1432", "src": "CO", "flight": "CO-1614-LAX-IAH", "sched_dep_time": "12:30 a.m.", "act_dep_time": "12:41 a.m.", "sched_arr_time": "5:35 a.m.", "act_arr_time": "5:26 a.m." }, { "_row": "1432", "tuple_id": "1433", "src": "CO", "flight": "CO-1088-CLE-IAH", "sched_dep_time": "8:40 a.m.", "act_dep_time": "8:40 a.m.", "sched_arr_time": "10:54 a.m.", "act_arr_time": "10:56 a.m." }, { "_row": "1433", "tuple_id": "1434", "src": "CO", "flight": "CO-58-DEN-IAH", "sched_dep_time": "11:25 a.m.", "act_dep_time": "11:32 a.m.", "sched_arr_time": "2:50 p.m.", "act_arr_time": "3:31 p.m." }, { "_row": "1434", "tuple_id": "1435", "src": "CO", "flight": "CO-50-CLE-EWR", "sched_dep_time": "2:55 p.m.", "act_dep_time": "3:31 p.m.", "sched_arr_time": "4:49 p.m.", "act_arr_time": "5:26 p.m." } ], "ground_truth": [], "predicted_repairs": [ { "row": 1431, "column": "act_arr_time", "new_value": "5:26 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1432, "column": "act_arr_time", "new_value": "10:56 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1433, "column": "act_arr_time", "new_value": "3:31 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1434, "column": "act_arr_time", "new_value": "5:26 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1431,\"column\":\"act_arr_time\",\"new_value\":\"5:26 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1432,\"column\":\"act_arr_time\",\"new_value\":\"10:56 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1433,\"column\":\"act_arr_time\",\"new_value\":\"3:31 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1434,\"column\":\"act_arr_time\",\"new_value\":\"5:26 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 100, "dataset": "hospital", "inferability": "not_inferable_from_prompt", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 0, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "overrepair": 4 }, "target_rows": [ { "_row": "623", "index": "624", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "82%", "Sample": "527 patients", "Stateavg": "al_hf-1" }, { "_row": "624", "index": "625", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "100%", "Sample": "570 patients", "Stateavg": "al_hf-2" }, { "_row": "625", "index": "626", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-3", "MeasureName": "heart failure patients given ace inhibitor or arb for left ventricular systolic dysfunction (lvsd)", "Score": "92%", "Sample": "272 patients", "Stateavg": "al_hf-3" }, { "_row": "626", "index": "627", "ProviderNumber": "10029", "HospitalName": "east alabama medical center and snf", "Address1": "2000 pepperell parkway", "Address2": "empty", "Address3": "empty", "City": "opelika", "State": "al", "ZipCode": "36801", "CountyName": "lee", "PhoneNumber": "3347493411", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-4", "MeasureName": "heart failure patients given smoking cessation advice/counseling", "Score": "100%", "Sample": "101 patients", "Stateavg": "al_hf-4" } ], "ground_truth": [], "predicted_repairs": [ { "row": 623, "column": "Address1", "new_value": "2000 pepperell parkway", "reason": "The address does not exist." }, { "row": 624, "column": "Address1", "new_value": "2000 pepperell parkway", "reason": "The address does not exist." }, { "row": 625, "column": "Address1", "new_value": "2000 pepperell parkway", "reason": "The address does not exist." }, { "row": 626, "column": "Address1", "new_value": "2000 pepperell parkway", "reason": "The address does not exist." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":623,\"column\":\"Address1\",\"new_value\":\"2000 pepperell parkway\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '2000 pepperell parkway' does not exist.\"},{\"row\":624,\"column\":\"Address1\",\"new_value\":\"2000 pepperell parkway\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '2000 pepperell parkway' does not exist.\"},{\"row\":625,\"column\":\"Address1\",\"new_value\":\"2000 pepperell parkway\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '2000 pepperell parkway' does not exist.\"},{\"row\":626,\"column\":\"Address1\",\"new_value\":\"2000 pepperell parkway\",\"reason\":\"The address does not exist.\",\"why\":\"This is a potential error as the address '2000 pepperell parkway' does not exist.\"}]}" } ], "external_reference_required": [ { "task_index": 1, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4 }, "target_rows": [ { "_row": "55", "index": "56", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-2", "MeasureName": "pneumonia patients assessed and given pneumococcal vaccination", "Score": "97%", "Sample": "172 patients", "Stateavg": "al_pn-2" }, { "_row": "56", "index": "57", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boxz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-3b", "MeasureName": "pneumonia patients whose initial emergency room blood culture was performed prior to the administration of the first hospital dose of antibiotics", "Score": "97%", "Sample": "120 patients", "Stateavg": "al_pn-xb" }, { "_row": "57", "index": "58", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505xuxsxhighwayx431xnorth", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2x6x938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-4", "MeasureName": "pneumonia patients given smoking cessation advice/counseling", "Score": "97%", "Sample": "98 patients", "Stateavg": "al_pn-4" }, { "_row": "58", "index": "59", "ProviderNumber": "10005", "HospitalName": "marshall medical center south", "Address1": "2505 u s highway 431 north", "Address2": "empty", "Address3": "empty", "City": "boaz", "State": "al", "ZipCode": "35957", "CountyName": "marshall", "PhoneNumber": "2565938310", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-5c", "MeasureName": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "Score": "96%", "Sample": "211 patients", "Stateavg": "al_pn-5c" } ], "ground_truth": [ { "row": 56, "column": "City", "clean_value": "boaz" }, { "row": 56, "column": "Stateavg", "clean_value": "al_pn-3b" }, { "row": 57, "column": "Address1", "clean_value": "2505 u s highway 431 north" }, { "row": 57, "column": "PhoneNumber", "clean_value": "2565938310" } ], "predicted_repairs": [], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":55,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'\"},{\"row\":56,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'\"},{\"row\":57,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'\"},{\"row\":58,\"column\":\"ProviderNumber\",\"new_value\":\"10005\",\"reason\":\"Corrected Provider Number for patient with Condition 'pneumonia'}]}" }, { "task_index": 2, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 16, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "wrong_value": 4 }, "target_rows": [ { "_row": "792", "tuple_id": "793", "src": "mia", "flight": "AA-2050-ORD-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "2:45P 12-01-11", "act_arr_time": "2:46P" }, { "_row": "793", "tuple_id": "794", "src": "mia", "flight": "AA-1165-JFK-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "10:34A 12-01-11", "act_arr_time": "10:08A" }, { "_row": "794", "tuple_id": "795", "src": "mia", "flight": "AA-484-DFW-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "7:55P 12-01-11", "act_arr_time": "7:39P" }, { "_row": "795", "tuple_id": "796", "src": "mia", "flight": "AA-466-IAH-MIA", "sched_dep_time": "", "act_dep_time": "", "sched_arr_time": "9:20A 12-01-11", "act_arr_time": "9:04A" } ], "ground_truth": [ { "row": 792, "column": "sched_dep_time", "clean_value": "10:40 a.m." }, { "row": 792, "column": "act_dep_time", "clean_value": "11:05 a.m." }, { "row": 792, "column": "sched_arr_time", "clean_value": "2:45 p.m." }, { "row": 792, "column": "act_arr_time", "clean_value": "2:46 p.m." }, { "row": 793, "column": "sched_dep_time", "clean_value": "6:59 a.m." }, { "row": 793, "column": "act_dep_time", "clean_value": "7:22 a.m." }, { "row": 793, "column": "sched_arr_time", "clean_value": "10:34 a.m." }, { "row": 793, "column": "act_arr_time", "clean_value": "10:04 a.m." }, { "row": 794, "column": "sched_dep_time", "clean_value": "4:15 p.m." }, { "row": 794, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 794, "column": "sched_arr_time", "clean_value": "7:55 p.m." }, { "row": 794, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 795, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 795, "column": "act_dep_time", "clean_value": "6:08 a.m." }, { "row": 795, "column": "sched_arr_time", "clean_value": "9:20 a.m." }, { "row": 795, "column": "act_arr_time", "clean_value": "9:05 a.m." } ], "predicted_repairs": [ { "row": 792, "column": "act_arr_time", "new_value": "2:46P", "reason": "The new value for act_arr_time is incorrect." }, { "row": 793, "column": "act_arr_time", "new_value": "10:08A", "reason": "The new value for act_arr_time is incorrect." }, { "row": 794, "column": "act_arr_time", "new_value": "7:39P", "reason": "The new value for act_arr_time is incorrect." }, { "row": 795, "column": "act_arr_time", "new_value": "9:04A", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":792,\"column\":\"act_arr_time\",\"new_value\":\"2:46P\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":793,\"column\":\"act_arr_time\",\"new_value\":\"10:08A\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":794,\"column\":\"act_arr_time\",\"new_value\":\"7:39P\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":795,\"column\":\"act_arr_time\",\"new_value\":\"9:04A\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 4, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 4, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "overrepair": 4 }, "target_rows": [ { "_row": "711", "index": "712", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "1xx%", "Sample": "9 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "712", "index": "713", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection xrevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "713", "index": "714", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "33x28365x1", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery paxienxs needing hair removed from xhe surgical area before surgery who had hair removed using a safer mexhod (elecxric clippers or hair removal cream c nox a razor)", "Score": "100%", "Sample": "33 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "714", "index": "715", "ProviderNumber": "10034", "HospitalName": "community hospital inc", "Address1": "805 friendship road", "Address2": "empty", "Address3": "empty", "City": "tallassee", "State": "al", "ZipCode": "36078", "CountyName": "elmore", "PhoneNumber": "3342836541", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "no", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "88%", "Sample": "24 patients", "Stateavg": "al_scip-vte-1" } ], "ground_truth": [ { "row": 711, "column": "Score", "clean_value": "100%" }, { "row": 712, "column": "Condition", "clean_value": "surgical infection prevention" }, { "row": 713, "column": "PhoneNumber", "clean_value": "3342836541" }, { "row": 713, "column": "MeasureName", "clean_value": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)" } ], "predicted_repairs": [ { "row": 711, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 712, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 713, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 714, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":711,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"},{\"row\":712,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"},{\"row\":713,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"},{\"row\":714,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\"}]}" }, { "task_index": 7, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "483", "index": "484", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "xl", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-card-2", "MeasureName": "surgery patients who were taking heart drugs called beta blockers before coming to the hospital who were kept on the beta blockers during the period just before and after their surgery", "Score": "100%", "Sample": "12 patients", "Stateavg": "al_scip-card-2" }, { "_row": "484", "index": "485", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "1x6 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "94%", "Sample": "52 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "485", "index": "486", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "xzark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "96%", "Sample": "52 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "486", "index": "487", "ProviderNumber": "10021", "HospitalName": "dale medical center", "Address1": "126 hospital ave", "Address2": "empty", "Address3": "empty", "City": "ozark", "State": "al", "ZipCode": "36360", "CountyName": "dale", "PhoneNumber": "3347742601", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "85%", "Sample": "48 patients", "Stateavg": "al_scip-inf-3" } ], "ground_truth": [ { "row": 483, "column": "State", "clean_value": "al" }, { "row": 484, "column": "Address1", "clean_value": "126 hospital ave" }, { "row": 485, "column": "City", "clean_value": "ozark" } ], "predicted_repairs": [ { "row": 483, "column": "Address1", "new_value": "126 hospital ave", "reason": "The address is incorrect." }, { "row": 484, "column": "Address1", "new_value": "1x6 hospital ave", "reason": "The address is incorrect." }, { "row": 485, "column": "Address1", "new_value": "126 hospital ave", "reason": "The address is incorrect." }, { "row": 486, "column": "Address1", "new_value": "126 hospital ave", "reason": "The address is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":483,\"column\":\"Address1\",\"new_value\":\"126 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"},{\"row\":484,\"column\":\"Address1\",\"new_value\":\"1x6 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"},{\"row\":485,\"column\":\"Address1\",\"new_value\":\"126 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"},{\"row\":486,\"column\":\"Address1\",\"new_value\":\"126 hospital ave\",\"reason\":\"The address is incorrect.\",\"why\":\"This address does not match any allowed column values.\"}]}" }, { "task_index": 8, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 12, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 1, "wrong_value": 3 }, "target_rows": [ { "_row": "2025", "tuple_id": "2026", "src": "allegiantair", "flight": "UA-2708-EWR-CLT", "sched_dep_time": "", "act_dep_time": "3:04 p.m.", "sched_arr_time": "", "act_arr_time": "4:24 p.m." }, { "_row": "2026", "tuple_id": "2027", "src": "allegiantair", "flight": "UA-62-IAH-EWR", "sched_dep_time": "", "act_dep_time": "2:59 p.m.", "sched_arr_time": "", "act_arr_time": "7:10 p.m." }, { "_row": "2027", "tuple_id": "2028", "src": "allegiantair", "flight": "UA-1500-IAH-GUA", "sched_dep_time": "", "act_dep_time": "9:43 a.m.", "sched_arr_time": "", "act_arr_time": "12:12 p.m." }, { "_row": "2028", "tuple_id": "2029", "src": "allegiantair", "flight": "AA-3804-PHL-ORD", "sched_dep_time": "2:35 p.m.", "act_dep_time": "2:44 p.m.", "sched_arr_time": "4:05 p.m.", "act_arr_time": "3:36 p.m." } ], "ground_truth": [ { "row": 2025, "column": "sched_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "act_dep_time", "clean_value": "2:55 p.m." }, { "row": 2025, "column": "sched_arr_time", "clean_value": "4:53 p.m." }, { "row": 2025, "column": "act_arr_time", "clean_value": "4:44 p.m." }, { "row": 2026, "column": "sched_dep_time", "clean_value": "2:30 p.m." }, { "row": 2026, "column": "act_dep_time", "clean_value": "2:48 p.m." }, { "row": 2026, "column": "sched_arr_time", "clean_value": "7:03 p.m." }, { "row": 2027, "column": "sched_dep_time", "clean_value": "8:55 a.m." }, { "row": 2027, "column": "act_dep_time", "clean_value": "9:16 a.m." }, { "row": 2027, "column": "sched_arr_time", "clean_value": "11:45 a.m." }, { "row": 2027, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 2028, "column": "act_arr_time", "clean_value": "3:43 p.m." } ], "predicted_repairs": [ { "row": 2025, "column": "act_arr_time", "new_value": "4:24 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 2026, "column": "act_arr_time", "new_value": "7:10 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 2027, "column": "act_arr_time", "new_value": "12:12 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 2028, "column": "act_arr_time", "new_value": "3:36 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":2025,\"column\":\"act_arr_time\",\"new_value\":\"4:24 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":2026,\"column\":\"act_arr_time\",\"new_value\":\"7:10 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":2027,\"column\":\"act_arr_time\",\"new_value\":\"12:12 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":2028,\"column\":\"act_arr_time\",\"new_value\":\"3:36 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 11, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 14, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "wrong_value": 4 }, "target_rows": [ { "_row": "1535", "tuple_id": "1536", "src": "flytecomm", "flight": "CO-1193-EWR-MCO", "sched_dep_time": "9:15 a.m.", "act_dep_time": "", "sched_arr_time": "12:18 p.m.", "act_arr_time": "" }, { "_row": "1536", "tuple_id": "1537", "src": "flytecomm", "flight": "AA-3842-MSP-ORD", "sched_dep_time": "", "act_dep_time": "6:57 a.m.", "sched_arr_time": "", "act_arr_time": "7:49 a.m." }, { "_row": "1537", "tuple_id": "1538", "src": "flytecomm", "flight": "AA-643-MIA-ORD", "sched_dep_time": "", "act_dep_time": "7:31 a.m.", "sched_arr_time": "", "act_arr_time": "9:26 a.m." }, { "_row": "1538", "tuple_id": "1539", "src": "flytecomm", "flight": "AA-1007-MIA-PHX", "sched_dep_time": "", "act_dep_time": "5:09 p.m.", "sched_arr_time": "", "act_arr_time": "7:43 p.m." } ], "ground_truth": [ { "row": 1535, "column": "act_dep_time", "clean_value": "9:14 a.m." }, { "row": 1535, "column": "act_arr_time", "clean_value": "12:09 p.m." }, { "row": 1536, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 1536, "column": "act_dep_time", "clean_value": "6:56 a.m." }, { "row": 1536, "column": "sched_arr_time", "clean_value": "7:30 a.m." }, { "row": 1536, "column": "act_arr_time", "clean_value": "7:51 a.m." }, { "row": 1537, "column": "sched_dep_time", "clean_value": "7:10 a.m." }, { "row": 1537, "column": "act_dep_time", "clean_value": "7:30 a.m." }, { "row": 1537, "column": "sched_arr_time", "clean_value": "9:35 a.m." }, { "row": 1537, "column": "act_arr_time", "clean_value": "9:31 a.m." }, { "row": 1538, "column": "sched_dep_time", "clean_value": "4:55 p.m." }, { "row": 1538, "column": "act_dep_time", "clean_value": "5:08 p.m." }, { "row": 1538, "column": "sched_arr_time", "clean_value": "8:05 p.m." }, { "row": 1538, "column": "act_arr_time", "clean_value": "7:55 p.m." } ], "predicted_repairs": [ { "row": 1535, "column": "act_arr_time", "new_value": "7:49 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1536, "column": "act_arr_time", "new_value": "9:26 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1537, "column": "act_arr_time", "new_value": "7:43 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1538, "column": "act_arr_time", "new_value": "7:49 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1535,\"column\":\"act_arr_time\",\"new_value\":\"7:49 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1536,\"column\":\"act_arr_time\",\"new_value\":\"9:26 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1537,\"column\":\"act_arr_time\",\"new_value\":\"7:43 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1538,\"column\":\"act_arr_time\",\"new_value\":\"7:49 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 12, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 4 }, "target_rows": [ { "_row": "1774", "index": "1775", "id": "1841", "beer-name": "Alpha Blackback", "style": "American Black Ale", "ounces": "12.0 oz", "abv": "0.07200000000000001%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1775", "index": "1776", "id": "1782", "beer-name": "Kiss Off IPA", "style": "American IPA", "ounces": "12.0 oz.", "abv": "0.063%", "ibu": "N/A", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1776", "index": "1777", "id": "1552", "beer-name": "Dog Days Summer Ale", "style": "K\u00f6lsch", "ounces": "12.0 oz.", "abv": "0.045%", "ibu": "28", "brewery_id": "164", "brewery-name": "Round Guys Brewing", "city": "Lansdale", "state": "PA" }, { "_row": "1777", "index": "1778", "id": "1479", "beer-name": "1881 California Red", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.055999999999999994%", "ibu": "35", "brewery_id": "397", "brewery-name": "Ruhstaller Beer Company", "city": "Sacramento", "state": "CA" } ], "ground_truth": [ { "row": 1774, "column": "ounces", "clean_value": "12" }, { "row": 1774, "column": "abv", "clean_value": "0.072" }, { "row": 1774, "column": "ibu", "clean_value": "" }, { "row": 1775, "column": "ounces", "clean_value": "12" }, { "row": 1775, "column": "abv", "clean_value": "0.063" }, { "row": 1775, "column": "ibu", "clean_value": "" }, { "row": 1776, "column": "ounces", "clean_value": "12" }, { "row": 1776, "column": "abv", "clean_value": "0.045" }, { "row": 1777, "column": "ounces", "clean_value": "12" }, { "row": 1777, "column": "abv", "clean_value": "0.056" } ], "predicted_repairs": [ { "row": 1777, "column": "beer-name", "new_value": "1881 California Red", "reason": "This beer has a different name than the other beers in the contract." }, { "row": 1776, "column": "beer-name", "new_value": "Kiss Off IPA", "reason": "This beer has a different style than the other beers in the contract." }, { "row": 1775, "column": "beer-name", "new_value": "Alpha Blackback", "reason": "This beer has a different brewery name than the other beers in the contract." }, { "row": 1774, "column": "beer-name", "new_value": "Kiss Off IPA", "reason": "This beer has a different style than the other beers in the contract." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1777,\"column\":\"beer-name\",\"new_value\":\"1881 California Red\",\"reason\":\"This beer has a different name than the other beers in the contract.\"},{\"row\":1776,\"column\":\"beer-name\",\"new_value\":\"Kiss Off IPA\",\"reason\":\"This beer has a different style than the other beers in the contract.\"},{\"row\":1775,\"column\":\"beer-name\",\"new_value\":\"Alpha Blackback\",\"reason\":\"This beer has a different brewery name than the other beers in the contract.\"},{\"row\":1774,\"column\":\"beer-name\",\"new_value\":\"Kiss Off IPA\",\"reason\":\"This beer has a different style than the other beers in the contract.\"}]}" }, { "task_index": 13, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 }, "target_rows": [ { "_row": "881", "index": "882", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "82%", "Sample": "11 patients", "Stateavg": "al_ami-5" }, { "_row": "882", "index": "883", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "883", "index": "884", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "al", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "x0593x5966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" }, { "_row": "884", "index": "885", "ProviderNumber": "10045", "HospitalName": "fayette medical center", "Address1": "1653 temple avenue north", "Address2": "empty", "Address3": "empty", "City": "fayette", "State": "xl", "ZipCode": "35555", "CountyName": "fayette", "PhoneNumber": "2059325966", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - other", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "87%", "Sample": "67 patients", "Stateavg": "al_hf-1" } ], "ground_truth": [ { "row": 881, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 883, "column": "PhoneNumber", "clean_value": "2059325966" }, { "row": 884, "column": "State", "clean_value": "al" } ], "predicted_repairs": [ { "row": 881, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." }, { "row": 882, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." }, { "row": 883, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." }, { "row": 884, "column": "ProviderNumber", "new_value": "10045", "reason": "The patient's address does not match any hospital records." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":881,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"},{\"row\":882,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"},{\"row\":883,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"},{\"row\":884,\"column\":\"ProviderNumber\",\"new_value\":\"10045\",\"reason\":\"The patient's address does not match any hospital records.\",\"why\":\"This is a potential error as the address provided does not correspond to any hospital records.\"}]}" }, { "task_index": 14, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "wrong_value": 4 }, "target_rows": [ { "_row": "1675", "tuple_id": "1676", "src": "wunderground", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:45 a.m.", "sched_arr_time": "4:37 p.m.", "act_arr_time": "4:57 p.m." }, { "_row": "1676", "tuple_id": "1677", "src": "wunderground", "flight": "AA-2957-DFW-CVG", "sched_dep_time": "7:55 a.m.", "act_dep_time": "8:05 a.m.", "sched_arr_time": "10:55 a.m.", "act_arr_time": "10:58 a.m." }, { "_row": "1677", "tuple_id": "1678", "src": "wunderground", "flight": "AA-1664-MIA-ATL", "sched_dep_time": "10:15 a.m.", "act_dep_time": "10:19 a.m.", "sched_arr_time": "11:43 a.m.", "act_arr_time": "11:50 a.m." }, { "_row": "1678", "tuple_id": "1679", "src": "wunderground", "flight": "AA-3979-CVG-ORD", "sched_dep_time": "7:30 a.m.", "act_dep_time": "8:04 a.m.", "sched_arr_time": "7:50 a.m.", "act_arr_time": "7:59 a.m." } ], "ground_truth": [ { "row": 1675, "column": "act_dep_time", "clean_value": "11:30 a.m." }, { "row": 1675, "column": "sched_arr_time", "clean_value": "4:57 p.m." }, { "row": 1675, "column": "act_arr_time", "clean_value": "5:05 p.m." }, { "row": 1676, "column": "act_dep_time", "clean_value": "8:04 a.m." }, { "row": 1676, "column": "sched_arr_time", "clean_value": "11:05 a.m." }, { "row": 1676, "column": "act_arr_time", "clean_value": "11:01 a.m." }, { "row": 1677, "column": "act_dep_time", "clean_value": "10:18 a.m." }, { "row": 1677, "column": "sched_arr_time", "clean_value": "12:10 p.m." }, { "row": 1677, "column": "act_arr_time", "clean_value": "11:56 a.m." }, { "row": 1678, "column": "sched_arr_time", "clean_value": "8:00 a.m." }, { "row": 1678, "column": "act_arr_time", "clean_value": "8:06 a.m." } ], "predicted_repairs": [ { "row": 1675, "column": "act_arr_time", "new_value": "4:57 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1676, "column": "act_arr_time", "new_value": "10:58 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1677, "column": "act_arr_time", "new_value": "11:50 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1678, "column": "act_arr_time", "new_value": "7:59 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1675,\"column\":\"act_arr_time\",\"new_value\":\"4:57 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1676,\"column\":\"act_arr_time\",\"new_value\":\"10:58 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1677,\"column\":\"act_arr_time\",\"new_value\":\"11:50 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1678,\"column\":\"act_arr_time\",\"new_value\":\"7:59 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 16, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 3, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3, "overrepair": 4 }, "target_rows": [ { "_row": "734", "index": "735", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "99%", "Sample": "411 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "735", "index": "736", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scix-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "98%", "Sample": "417 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "736", "index": "737", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912xalabamaxhighwayx157", "Address2": "empty", "Address3": "empty", "City": "cuxxman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "98%", "Sample": "405 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "737", "index": "738", "ProviderNumber": "10035", "HospitalName": "cullman regional medical center", "Address1": "1912 alabama highway 157", "Address2": "empty", "Address3": "empty", "City": "cullman", "State": "al", "ZipCode": "35058", "CountyName": "cullman", "PhoneNumber": "2567372000", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 735, "column": "MeasureCode", "clean_value": "scip-inf-2" }, { "row": 736, "column": "Address1", "clean_value": "1912 alabama highway 157" }, { "row": 736, "column": "City", "clean_value": "cullman" } ], "predicted_repairs": [ { "row": 734, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 735, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 736, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." }, { "row": 737, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be found." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":734,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"},{\"row\":735,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"},{\"row\":736,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"},{\"row\":737,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be found.\",\"why\":\"This may indicate that the patient has been discharged from the hospital without a proper discharge plan or that their current discharge plan does not include all necessary medications.\"}]}" }, { "task_index": 17, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 10, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 10, "overrepair": 3, "wrong_cell": 1 }, "target_rows": [ { "_row": "167", "tuple_id": "168", "src": "boston", "flight": "UA-3515-IAD-MSP", "sched_dep_time": "", "act_dep_time": "8:26 a.m.", "sched_arr_time": "", "act_arr_time": "9:54 a.m." }, { "_row": "168", "tuple_id": "169", "src": "boston", "flight": "AA-3468-CVG-MIA", "sched_dep_time": "7:00 a.m.", "act_dep_time": "7:25 a.m.", "sched_arr_time": "9:55 a.m.", "act_arr_time": "9:42 a.m." }, { "_row": "169", "tuple_id": "170", "src": "boston", "flight": "AA-484-DFW-MIA", "sched_dep_time": "4:15 p.m.", "act_dep_time": "4:30 p.m.", "sched_arr_time": "7:55 p.m.", "act_arr_time": "7:35 p.m." }, { "_row": "170", "tuple_id": "171", "src": "boston", "flight": "AA-1886-BOS-MIA", "sched_dep_time": "", "act_dep_time": "10:55 a.m.", "sched_arr_time": "", "act_arr_time": "1:34 p.m." } ], "ground_truth": [ { "row": 167, "column": "sched_dep_time", "clean_value": "8:15 a.m." }, { "row": 167, "column": "act_dep_time", "clean_value": "8:12 a.m." }, { "row": 167, "column": "sched_arr_time", "clean_value": "10:06 a.m." }, { "row": 167, "column": "act_arr_time", "clean_value": "9:56 a.m." }, { "row": 168, "column": "act_arr_time", "clean_value": "9:45 a.m." }, { "row": 169, "column": "act_dep_time", "clean_value": "4:29 p.m." }, { "row": 169, "column": "act_arr_time", "clean_value": "7:39 p.m." }, { "row": 170, "column": "sched_dep_time", "clean_value": "10:45 a.m." }, { "row": 170, "column": "sched_arr_time", "clean_value": "2:20 p.m." }, { "row": 170, "column": "act_arr_time", "clean_value": "1:40 p.m." } ], "predicted_repairs": [ { "row": 170, "column": "flight", "new_value": "AA-1886-BOS-MIA", "reason": "The flight AA-1886-BOS-MIA is not listed in the contract version." }, { "row": 167, "column": "flight", "new_value": "UA-3515-IAD-MSP", "reason": "The flight UA-3515-IAD-MSP is not listed in the contract version." }, { "row": 169, "column": "flight", "new_value": "AA-484-DFW-MIA", "reason": "The flight AA-484-DFW-MIA is not listed in the contract version." }, { "row": 171, "column": "flight", "new_value": "NA", "reason": "No flights are listed in the contract version." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":170,\"column\":\"flight\",\"new_value\":\"AA-1886-BOS-MIA\",\"reason\":\"The flight AA-1886-BOS-MIA is not listed in the contract version.\"},{\"row\":167,\"column\":\"flight\",\"new_value\":\"UA-3515-IAD-MSP\",\"reason\":\"The flight UA-3515-IAD-MSP is not listed in the contract version.\"},{\"row\":169,\"column\":\"flight\",\"new_value\":\"AA-484-DFW-MIA\",\"reason\":\"The flight AA-484-DFW-MIA is not listed in the contract version.\"},{\"row\":171,\"column\":\"flight\",\"new_value\":\"NA\",\"reason\":\"No flights are listed in the contract version.\"}]}" }, { "task_index": 18, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 1, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 1 }, "target_rows": [ { "_row": "1589", "index": "1590", "id": "785", "beer-name": "Old Chub (2003)", "style": "Scottish Ale", "ounces": "12.0 oz", "abv": "0.08", "ibu": "35", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1590", "index": "1591", "id": "745", "beer-name": "Dale's Pale Ale (2008)", "style": "American Pale Ale (APA)", "ounces": "12.0 ounce", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" }, { "_row": "1591", "index": "1592", "id": "744", "beer-name": "Dale's Pale Ale (2006)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz.", "abv": "0.065%", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons CO", "state": "" }, { "_row": "1592", "index": "1593", "id": "743", "beer-name": "Dale's Pale Ale (2004)", "style": "American Pale Ale (APA)", "ounces": "12.0 oz", "abv": "0.065", "ibu": "65", "brewery_id": "503", "brewery-name": "Oskar Blues Brewery", "city": "Lyons", "state": "CO" } ], "ground_truth": [ { "row": 1589, "column": "ounces", "clean_value": "12" }, { "row": 1590, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "ounces", "clean_value": "12" }, { "row": 1591, "column": "abv", "clean_value": "0.065" }, { "row": 1591, "column": "city", "clean_value": "Lyons" }, { "row": 1591, "column": "state", "clean_value": "CO" }, { "row": 1592, "column": "ounces", "clean_value": "12" } ], "predicted_repairs": [ { "row": 1592, "column": "style", "new_value": "Scottish Ale", "reason": "The beer name has been changed to 'Scottish Ale' which is a different style than the original 'Scottish Ale'." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1592,\"column\":\"style\",\"new_value\":\"Scottish Ale\",\"reason\":\"The beer name has been changed to 'Scottish Ale' which is a different style than the original 'Scottish Ale'.\"}]}" }, { "task_index": 19, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 }, "target_rows": [ { "_row": "512", "index": "513", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" }, { "_row": "513", "index": "514", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "chxrokxx", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "100%", "Sample": "6 patients", "Stateavg": "al_scip-inf-6" }, { "_row": "514", "index": "515", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-1", "MeasureName": "surgery patients whose doctors ordered treatments to prevent blood clots after certain types of surgeries", "Score": "1xx%", "Sample": "5 patients", "Stateavg": "al_scip-vte-1" }, { "_row": "515", "index": "516", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-vte-2", "MeasureName": "patients who got treatment at the right time (within 24 hours before or after their surgery) to help prevent blood clots after certain types of surgery", "Score": "100%", "Sample": "5 patients", "Stateavg": "al_scip-vte-2" } ], "ground_truth": [ { "row": 513, "column": "CountyName", "clean_value": "cherokee" }, { "row": 514, "column": "Score", "clean_value": "100%" } ], "predicted_repairs": [ { "row": 512, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." }, { "row": 513, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." }, { "row": 514, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." }, { "row": 515, "column": "ProviderNumber", "new_value": "10022", "reason": "The patient's condition requires immediate attention and may require urgent care." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":512,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"},{\"row\":513,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"},{\"row\":514,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"},{\"row\":515,\"column\":\"ProviderNumber\",\"new_value\":\"10022\",\"reason\":\"The patient's condition requires immediate attention and may require urgent care.\",\"why\":\"The patient's condition necessitates prompt intervention as it could potentially lead to severe complications if left untreated.\"}]}" }, { "task_index": 22, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 }, "target_rows": [ { "_row": "870", "index": "871", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-1", "MeasureName": "surgery patients who were given an antibiotic at the right time (within one hour before surgery) to help prevent infection", "Score": "80%", "Sample": "15 patients", "Stateavg": "al_scip-inf-1" }, { "_row": "871", "index": "872", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "87%", "Sample": "15 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "872", "index": "873", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntaxy non-pxofit - pxivate", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "87%", "Sample": "15 patiexts", "Stateavg": "al_scip-inf-3" }, { "_row": "873", "index": "874", "ProviderNumber": "10044", "HospitalName": "marion regional medical center", "Address1": "1256 military street south", "Address2": "empty", "Address3": "empty", "City": "hamilton", "State": "al", "ZipCode": "35570", "CountyName": "marion", "PhoneNumber": "2059216200", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_scip-inf-4" } ], "ground_truth": [ { "row": 872, "column": "HospitalOwner", "clean_value": "voluntary non-profit - private" }, { "row": 872, "column": "Sample", "clean_value": "15 patients" } ], "predicted_repairs": [ { "row": 870, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." }, { "row": 871, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." }, { "row": 872, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." }, { "row": 873, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null or empty." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":870,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"},{\"row\":871,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"},{\"row\":872,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"},{\"row\":873,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null or empty.\"}]}" }, { "task_index": 23, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 4 }, "target_rows": [ { "_row": "324", "tuple_id": "325", "src": "weather", "flight": "AA-789-ORD-DEN", "sched_dep_time": "1:05 p.m.", "act_dep_time": "1:20 p.m.", "sched_arr_time": "2:35 p.m.", "act_arr_time": "2:49 p.m." }, { "_row": "325", "tuple_id": "326", "src": "weather", "flight": "UA-854-SFO-IAH", "sched_dep_time": "7:53 a.m.", "act_dep_time": "8:07 a.m.", "sched_arr_time": "1:39 p.m.", "act_arr_time": "1:23 p.m." }, { "_row": "326", "tuple_id": "327", "src": "weather", "flight": "AA-415-BOS-ORD", "sched_dep_time": "8:35 a.m.", "act_dep_time": "", "sched_arr_time": "10:40 a.m.", "act_arr_time": "" }, { "_row": "327", "tuple_id": "328", "src": "weather", "flight": "AA-85-JFK-SFO", "sched_dep_time": "3:05 p.m.", "act_dep_time": "", "sched_arr_time": "6:30 p.m.", "act_arr_time": "" } ], "ground_truth": [ { "row": 324, "column": "act_dep_time", "clean_value": "1:19 p.m." }, { "row": 324, "column": "act_arr_time", "clean_value": "3:13 p.m." }, { "row": 325, "column": "act_dep_time", "clean_value": "7:49 a.m." }, { "row": 325, "column": "act_arr_time", "clean_value": "1:30 p.m." }, { "row": 326, "column": "act_dep_time", "clean_value": "8:56 a.m." }, { "row": 326, "column": "act_arr_time", "clean_value": "10:16 a.m." }, { "row": 327, "column": "act_dep_time", "clean_value": "3:36 p.m." }, { "row": 327, "column": "act_arr_time", "clean_value": "6:43 p.m." } ], "predicted_repairs": [ { "row": 324, "column": "act_arr_time", "new_value": "2:49 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 325, "column": "act_arr_time", "new_value": "1:23 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 326, "column": "act_arr_time", "new_value": "10:40 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 327, "column": "act_arr_time", "new_value": "", "reason": "The new value for act_arr_time is empty." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":324,\"column\":\"act_arr_time\",\"new_value\":\"2:49 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":325,\"column\":\"act_arr_time\",\"new_value\":\"1:23 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":326,\"column\":\"act_arr_time\",\"new_value\":\"10:40 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":327,\"column\":\"act_arr_time\",\"new_value\":\"\",\"reason\":\"The new value for act_arr_time is empty.\"}]}" }, { "task_index": 26, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 11, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 9, "overrepair": 2, "wrong_value": 2 }, "target_rows": [ { "_row": "471", "tuple_id": "472", "src": "flightview", "flight": "AA-4344-ORD-DTW", "sched_dep_time": "", "act_dep_time": "12:14 p.m.", "sched_arr_time": "", "act_arr_time": "2:01 p.m." }, { "_row": "472", "tuple_id": "473", "src": "flightview", "flight": "UA-257-JFK-SFO", "sched_dep_time": "2:30 p.m.", "act_dep_time": "2:43 p.m.", "sched_arr_time": "6:15 p.m.", "act_arr_time": "5:42 p.m." }, { "_row": "473", "tuple_id": "474", "src": "flightview", "flight": "UA-2945-PHL-CLT", "sched_dep_time": "12:00 p.m.", "act_dep_time": "12:08 p.m.", "sched_arr_time": "1:45 p.m.", "act_arr_time": "1:14 p.m." }, { "_row": "474", "tuple_id": "475", "src": "flightview", "flight": "CO-63-EWR-IAH", "sched_dep_time": "", "act_dep_time": "5:38 p.m.", "sched_arr_time": "", "act_arr_time": "8:03 p.m." } ], "ground_truth": [ { "row": 471, "column": "sched_dep_time", "clean_value": "11:45 a.m." }, { "row": 471, "column": "act_dep_time", "clean_value": "12:13 p.m." }, { "row": 471, "column": "sched_arr_time", "clean_value": "2:00 p.m." }, { "row": 471, "column": "act_arr_time", "clean_value": "2:10 p.m." }, { "row": 472, "column": "act_dep_time", "clean_value": "2:26 p.m." }, { "row": 473, "column": "sched_dep_time", "clean_value": "12:00 a.m." }, { "row": 473, "column": "act_dep_time", "clean_value": "3:11 a.m." }, { "row": 473, "column": "act_arr_time", "clean_value": "1:15 p.m." }, { "row": 474, "column": "sched_dep_time", "clean_value": "5:25 p.m." }, { "row": 474, "column": "act_dep_time", "clean_value": "5:22 p.m." }, { "row": 474, "column": "sched_arr_time", "clean_value": "8:22 p.m." } ], "predicted_repairs": [ { "row": 471, "column": "act_arr_time", "new_value": "2:01 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 472, "column": "act_arr_time", "new_value": "5:42 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 473, "column": "act_arr_time", "new_value": "1:14 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 474, "column": "act_arr_time", "new_value": "8:03 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":471,\"column\":\"act_arr_time\",\"new_value\":\"2:01 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":472,\"column\":\"act_arr_time\",\"new_value\":\"5:42 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":473,\"column\":\"act_arr_time\",\"new_value\":\"1:14 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":474,\"column\":\"act_arr_time\",\"new_value\":\"8:03 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 27, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 7, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "379", "index": "380", "id": "397", "beer-name": "SummerBright Ale", "style": "American Pale Wheat Ale", "ounces": "12.0 ounce", "abv": "0.045", "ibu": "15", "brewery_id": "391", "brewery-name": "Breckenridge Brewery", "city": "Denver", "state": "CO" }, { "_row": "380", "index": "381", "id": "193", "beer-name": "Lucky U IPA", "style": "American IPA", "ounces": "12.0 ounce", "abv": "0.062%", "ibu": "68", "brewery_id": "391", "brewery-name": "Breckenridge Brewery", "city": "Denver", "state": "CO" }, { "_row": "381", "index": "382", "id": "83", "beer-name": "Avalanche Ale", "style": "American Amber / Red Ale", "ounces": "12.0 oz", "abv": "0.054", "ibu": "19", "brewery_id": "391", "brewery-name": "Breckenridge Brewery", "city": "Denver CO", "state": "" }, { "_row": "382", "index": "383", "id": "1802", "beer-name": "You're My Boy, Blue", "style": "Fruit / Vegetable Beer", "ounces": "12.0 oz.", "abv": "0.05", "ibu": "N/A", "brewery_id": "308", "brewery-name": "Brew Bus Brewing", "city": "Tampa", "state": "FL" } ], "ground_truth": [ { "row": 379, "column": "ounces", "clean_value": "12" }, { "row": 380, "column": "ounces", "clean_value": "12" }, { "row": 380, "column": "abv", "clean_value": "0.062" }, { "row": 381, "column": "ounces", "clean_value": "12" }, { "row": 381, "column": "city", "clean_value": "Denver" }, { "row": 381, "column": "state", "clean_value": "CO" }, { "row": 382, "column": "ounces", "clean_value": "12" }, { "row": 382, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 379, "column": "abv", "new_value": "0.045", "reason": "The new value for abv is incorrect." }, { "row": 380, "column": "abv", "new_value": "0.062%", "reason": "The new value for abv is incorrect." }, { "row": 381, "column": "abv", "new_value": "0.054", "reason": "The new value for abv is incorrect." }, { "row": 382, "column": "abv", "new_value": "0.05", "reason": "The new value for abv is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":379,\"column\":\"abv\",\"new_value\":\"0.045\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":380,\"column\":\"abv\",\"new_value\":\"0.062%\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":381,\"column\":\"abv\",\"new_value\":\"0.054\",\"reason\":\"The new value for abv is incorrect.\"},{\"row\":382,\"column\":\"abv\",\"new_value\":\"0.05\",\"reason\":\"The new value for abv is incorrect.\"}]}" }, { "task_index": 28, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4 }, "target_rows": [ { "_row": "958", "index": "959", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprise", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-4", "MeasureName": "heart attack patients given smoking cessation advice/counseling", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-4" }, { "_row": "959", "index": "960", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprise", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-5", "MeasureName": "heart attack patients given beta blocker at discharge", "Score": "100%", "Sample": "2 patients", "Stateavg": "al_ami-5" }, { "_row": "960", "index": "961", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprxse", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "961", "index": "962", "ProviderNumber": "10049", "HospitalName": "medical center enterprise", "Address1": "400 n edwards street", "Address2": "empty", "Address3": "empty", "City": "enterprise", "State": "al", "ZipCode": "36330", "CountyName": "coffee", "PhoneNumber": "3343470584", "HospitalType": "acute care hospitals", "HospitalOwner": "proprietary", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-8a" } ], "ground_truth": [ { "row": 960, "column": "City", "clean_value": "enterprise" } ], "predicted_repairs": [ { "row": 958, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid phone number." }, { "row": 959, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid phone number." }, { "row": 960, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid phone number." }, { "row": 961, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid phone number." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":958,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid phone number.\"},{\"row\":959,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid phone number.\"},{\"row\":960,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid phone number.\"},{\"row\":961,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid phone number.\"}]}" }, { "task_index": 29, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.1667, "precision": 0.25, "recall": 0.125, "tp": 1, "fp": 3, "fn": 7, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 4, "wrong_value": 3 }, "target_rows": [ { "_row": "931", "tuple_id": "932", "src": "flightarrival", "flight": "AA-3-JFK-LAX", "sched_dep_time": "12:00 p.m.", "act_dep_time": "12:12 p.m.", "sched_arr_time": "3:15 p.m.", "act_arr_time": "3:10 p.m." }, { "_row": "932", "tuple_id": "933", "src": "flightarrival", "flight": "CO-1694-LAX-IAH", "sched_dep_time": "7:15 p.m.", "act_dep_time": "7:15 p.m. (Estimated)", "sched_arr_time": "12:21 a.m.", "act_arr_time": "12:21 a.m. (Estimated)" }, { "_row": "933", "tuple_id": "934", "src": "flightarrival", "flight": "CO-1193-EWR-MCO", "sched_dep_time": "9:15 a.m.", "act_dep_time": "", "sched_arr_time": "12:18 p.m.", "act_arr_time": "" }, { "_row": "934", "tuple_id": "935", "src": "flightarrival", "flight": "UA-2906-PHL-MCO", "sched_dep_time": "3:50 p.m.", "act_dep_time": "4:46 p.m.", "sched_arr_time": "6:23 p.m.", "act_arr_time": "6:36 p.m." } ], "ground_truth": [ { "row": 931, "column": "act_dep_time", "clean_value": "12:11 p.m." }, { "row": 931, "column": "act_arr_time", "clean_value": "3:16 p.m." }, { "row": 932, "column": "act_dep_time", "clean_value": "7:15 p.m." }, { "row": 932, "column": "act_arr_time", "clean_value": "12:21 a.m." }, { "row": 933, "column": "act_dep_time", "clean_value": "9:14 a.m." }, { "row": 933, "column": "act_arr_time", "clean_value": "12:09 p.m." }, { "row": 934, "column": "act_dep_time", "clean_value": "4:28 p.m." }, { "row": 934, "column": "act_arr_time", "clean_value": "6:38 p.m." } ], "predicted_repairs": [ { "row": 931, "column": "act_arr_time", "new_value": "12:21 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 932, "column": "act_arr_time", "new_value": "12:21 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 933, "column": "act_arr_time", "new_value": "6:36 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 934, "column": "act_arr_time", "new_value": "6:23 p.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":931,\"column\":\"act_arr_time\",\"new_value\":\"12:21 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":932,\"column\":\"act_arr_time\",\"new_value\":\"12:21 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":933,\"column\":\"act_arr_time\",\"new_value\":\"6:36 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":934,\"column\":\"act_arr_time\",\"new_value\":\"6:23 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 31, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 2, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 2, "overrepair": 4 }, "target_rows": [ { "_row": "521", "index": "522", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yxs", "Condition": "heart attack", "MeasureCode": "ami-7a", "MeasureName": "heart attack patients given fibrinolytic medication within 30 minutes of arrival", "Score": "empty", "Sample": "0 patients", "Stateavg": "al_ami-7a" }, { "_row": "522", "index": "523", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yes", "Condition": "heart attack", "MeasureCode": "ami-8a", "MeasureName": "heart attack patients given pci within 90 minutes of arrival", "Score": "96%", "Sample": "27 patients", "Stateavg": "al_ami-8a" }, { "_row": "523", "index": "524", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-1", "MeasureName": "heart failure patients given discharge instructions", "Score": "100%", "Sample": "25x patients", "Stateavg": "al_hf-1" }, { "_row": "524", "index": "525", "ProviderNumber": "10023", "HospitalName": "baptist medical center south", "Address1": "2105 east south boulevard", "Address2": "empty", "Address3": "empty", "City": "montgomery", "State": "al", "ZipCode": "36116", "CountyName": "montgomery", "PhoneNumber": "3342882100", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - church", "EmergencyService": "yes", "Condition": "heart failure", "MeasureCode": "hf-2", "MeasureName": "heart failure patients given an evaluation of left ventricular systolic (lvs) function", "Score": "100%", "Sample": "292 patients", "Stateavg": "al_hf-2" } ], "ground_truth": [ { "row": 521, "column": "EmergencyService", "clean_value": "yes" }, { "row": 523, "column": "Sample", "clean_value": "257 patients" } ], "predicted_repairs": [ { "row": 521, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid hospital name." }, { "row": 522, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid hospital name." }, { "row": 523, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid hospital name." }, { "row": 524, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's address does not have a valid hospital name." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":521,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid hospital name.\",\"why\":\"The address provided is for a different hospital or provider than what was specified in the contract.\"},{\"row\":522,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid hospital name.\",\"why\":\"The address provided is for a different hospital or provider than what was specified in the contract.\"},{\"row\":523,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid hospital name.\",\"why\":\"The address provided is for a different hospital or provider than what was specified in the contract.\"},{\"row\":524,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's address does not have a valid hospital name.\",\"why\":\"The address provided is for a different hospital or provider than what was specified in the contract.\"}]}" }, { "task_index": 32, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 9, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 8, "overrepair": 3, "wrong_value": 1 }, "target_rows": [ { "_row": "655", "tuple_id": "656", "src": "panynj", "flight": "AA-466-IAH-MIA", "sched_dep_time": "6:00 a.m.", "act_dep_time": "6:09 a.m.", "sched_arr_time": "9:20 a.m.", "act_arr_time": "9:05 a.m." }, { "_row": "656", "tuple_id": "657", "src": "panynj", "flight": "UA-3050-PHX-CLT", "sched_dep_time": "11:05 a.m.", "act_dep_time": "11:45 a.m.", "sched_arr_time": "4:57 p.m.", "act_arr_time": "5:03 p.m." }, { "_row": "657", "tuple_id": "658", "src": "panynj", "flight": "CO-89-IAH-EWR", "sched_dep_time": "", "act_dep_time": "6:17 a.m.", "sched_arr_time": "", "act_arr_time": "10:27 a.m." }, { "_row": "658", "tuple_id": "659", "src": "panynj", "flight": "CO-1088-CLE-IAH", "sched_dep_time": "", "act_dep_time": "9:01 a.m.", "sched_arr_time": "", "act_arr_time": "10:56 a.m." } ], "ground_truth": [ { "row": 655, "column": "act_dep_time", "clean_value": "6:08 a.m." }, { "row": 656, "column": "act_dep_time", "clean_value": "11:30 a.m." }, { "row": 656, "column": "act_arr_time", "clean_value": "5:05 p.m." }, { "row": 657, "column": "sched_dep_time", "clean_value": "6:00 a.m." }, { "row": 657, "column": "act_dep_time", "clean_value": "6:02 a.m." }, { "row": 657, "column": "sched_arr_time", "clean_value": "10:20 a.m." }, { "row": 658, "column": "sched_dep_time", "clean_value": "8:40 a.m." }, { "row": 658, "column": "act_dep_time", "clean_value": "8:40 a.m." }, { "row": 658, "column": "sched_arr_time", "clean_value": "10:54 a.m." } ], "predicted_repairs": [ { "row": 655, "column": "act_arr_time", "new_value": "9:05 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 656, "column": "act_arr_time", "new_value": "5:03 p.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 657, "column": "act_arr_time", "new_value": "10:27 a.m.", "reason": "The new value for act_arr_time is incorrect." }, { "row": 658, "column": "act_arr_time", "new_value": "10:56 a.m.", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":655,\"column\":\"act_arr_time\",\"new_value\":\"9:05 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":656,\"column\":\"act_arr_time\",\"new_value\":\"5:03 p.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":657,\"column\":\"act_arr_time\",\"new_value\":\"10:27 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":658,\"column\":\"act_arr_time\",\"new_value\":\"10:56 a.m.\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" }, { "task_index": 33, "dataset": "beers", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 3, "fn": 13, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 12, "overrepair": 2, "wrong_value": 1 }, "target_rows": [ { "_row": "541", "index": "542", "id": "61", "beer-name": "Supper Club Lager", "style": "American Pale Lager", "ounces": "12.0 ounce", "abv": "", "ibu": "N/A", "brewery_id": "192", "brewery-name": "Capital Brewery", "city": "Middleton", "state": "WI" }, { "_row": "542", "index": "543", "id": "784", "beer-name": "Carolina Lighthouse (2007)", "style": "American Blonde Ale", "ounces": "12.0 ounce", "abv": "0.04", "ibu": "N/A", "brewery_id": "504", "brewery-name": "Carolina Beer & Beverage", "city": "Mooresville NC", "state": "" }, { "_row": "543", "index": "544", "id": "783", "beer-name": "Carolina Blonde (2006)", "style": "American Blonde Ale", "ounces": "12.0 ounce", "abv": "0.05%", "ibu": "N/A", "brewery_id": "504", "brewery-name": "Carolina Beer & Beverage", "city": "Mooresville NC", "state": "" }, { "_row": "544", "index": "545", "id": "782", "beer-name": "Carolina Blonde Light (2005)", "style": "American Blonde Ale", "ounces": "12.0 oz", "abv": "0.035", "ibu": "N/A", "brewery_id": "504", "brewery-name": "Carolina Beer & Beverage", "city": "Mooresville", "state": "NC" } ], "ground_truth": [ { "row": 541, "column": "ounces", "clean_value": "12" }, { "row": 541, "column": "ibu", "clean_value": "" }, { "row": 542, "column": "ounces", "clean_value": "12" }, { "row": 542, "column": "ibu", "clean_value": "" }, { "row": 542, "column": "city", "clean_value": "Mooresville" }, { "row": 542, "column": "state", "clean_value": "NC" }, { "row": 543, "column": "ounces", "clean_value": "12" }, { "row": 543, "column": "abv", "clean_value": "0.05" }, { "row": 543, "column": "ibu", "clean_value": "" }, { "row": 543, "column": "city", "clean_value": "Mooresville" }, { "row": 543, "column": "state", "clean_value": "NC" }, { "row": 544, "column": "ounces", "clean_value": "12" }, { "row": 544, "column": "ibu", "clean_value": "" } ], "predicted_repairs": [ { "row": 541, "column": "abv", "new_value": "0.04", "reason": "The beer name has been changed to 'Carolina Lighthouse (2007)' which is a different style." }, { "row": 542, "column": "abv", "new_value": "0.05%", "reason": "The beer name has been changed to 'Carolina Blonde (2006)' which is a different style." }, { "row": 543, "column": "abv", "new_value": "0.035", "reason": "The beer name has been changed to 'Carolina Blonde Light (2005)' which is a different style." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":541,\"column\":\"abv\",\"new_value\":\"0.04\",\"reason\":\"The beer name has been changed to 'Carolina Lighthouse (2007)' which is a different style.\"},{\"row\":542,\"column\":\"abv\",\"new_value\":\"0.05%\",\"reason\":\"The beer name has been changed to 'Carolina Blonde (2006)' which is a different style.\"},{\"row\":543,\"column\":\"abv\",\"new_value\":\"0.035\",\"reason\":\"The beer name has been changed to 'Carolina Blonde Light (2005)' which is a different style.\"}]}" }, { "task_index": 34, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 1, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 1, "overrepair": 4 }, "target_rows": [ { "_row": "460", "index": "461", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-2", "MeasureName": "surgery patients who were given the right kind of antibiotic to help prevent infection", "Score": "91%", "Sample": "255 patients", "Stateavg": "al_scip-inf-2" }, { "_row": "461", "index": "462", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-3", "MeasureName": "surgery patients whose preventive antibiotics were stopped at the right time (within 24 hours after surgery)", "Score": "84%", "Sample": "245 patients", "Stateavg": "al_scip-inf-3" }, { "_row": "462", "index": "463", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-4", "MeasureName": "all heart surgery patients whose blood sugar (blood glucose) is kept under good control in the days right after surgery", "Score": "empty", "Sample": "x patients", "Stateavg": "al_scip-inf-4" }, { "_row": "463", "index": "464", "ProviderNumber": "10019", "HospitalName": "helen keller memorial hospital", "Address1": "1300 south montgomery avenue", "Address2": "empty", "Address3": "empty", "City": "sheffield", "State": "al", "ZipCode": "35660", "CountyName": "jefferson", "PhoneNumber": "2563864556", "HospitalType": "acute care hospitals", "HospitalOwner": "government - hospital district or authority", "EmergencyService": "yes", "Condition": "surgical infection prevention", "MeasureCode": "scip-inf-6", "MeasureName": "surgery patients needing hair removed from the surgical area before surgery who had hair removed using a safer method (electric clippers or hair removal cream c not a razor)", "Score": "97%", "Sample": "369 patients", "Stateavg": "al_scip-inf-6" } ], "ground_truth": [ { "row": 462, "column": "Sample", "clean_value": "0 patients" } ], "predicted_repairs": [ { "row": 460, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null." }, { "row": 461, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null." }, { "row": 462, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null." }, { "row": 463, "column": "ProviderNumber", "new_value": "none", "reason": "The patient's provider number cannot be null." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":460,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null.\",\"__type\":\"invalid_provider_number\"},{\"row\":461,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null.\",\"__type\":\"invalid_provider_number\"},{\"row\":462,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null.\",\"__type\":\"invalid_provider_number\"},{\"row\":463,\"column\":\"ProviderNumber\",\"new_value\":\"none\",\"reason\":\"The patient's provider number cannot be null.\",\"__type\":\"invalid_provider_number\"}]}" }, { "task_index": 37, "dataset": "hospital", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 0, "fn": 3, "parse_ok": false, "parse_error_kind": "truncated_json", "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 3 }, "target_rows": [ { "_row": "502", "index": "503", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "chxrokxx", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-2", "MeasureName": "pneumonia patients assessed and given pneumococcal vaccination", "Score": "93%", "Sample": "44 paxienxs", "Stateavg": "al_pn-2" }, { "_row": "503", "index": "504", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-3b", "MeasureName": "pneumonia patients whose initial emergency room blood culture was performed prior to the administration of the first hospital dose of antibiotics", "Score": "97%", "Sample": "33 patients", "Stateavg": "al_pn-3b" }, { "_row": "504", "index": "505", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "ax", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-4", "MeasureName": "pneumonia patients given smoking cessation advice/counseling", "Score": "100%", "Sample": "20 patients", "Stateavg": "al_pn-4" }, { "_row": "505", "index": "506", "ProviderNumber": "10022", "HospitalName": "cherokee medical center", "Address1": "400 northwood dr", "Address2": "empty", "Address3": "empty", "City": "centre", "State": "al", "ZipCode": "35960", "CountyName": "cherokee", "PhoneNumber": "2569275531", "HospitalType": "acute care hospitals", "HospitalOwner": "voluntary non-profit - private", "EmergencyService": "yes", "Condition": "pneumonia", "MeasureCode": "pn-5c", "MeasureName": "pneumonia patients given initial antibiotic(s) within 6 hours after arrival", "Score": "89%", "Sample": "56 patients", "Stateavg": "al_pn-5c" } ], "ground_truth": [ { "row": 502, "column": "CountyName", "clean_value": "cherokee" }, { "row": 502, "column": "Sample", "clean_value": "44 patients" }, { "row": 504, "column": "State", "clean_value": "al" } ], "predicted_repairs": [], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":502,\"column\":\"ProviderNumber\",\"new_value\":\"Voluntary Non-Profit - Private\",\"reason\":\"The ProviderNumber is already Voluntary Non-Profit - Private which does not require any changes.\",\"strict:false}]}" }, { "task_index": 38, "dataset": "flights", "inferability": "external_reference_required", "f1": 0.0, "precision": 0.0, "recall": 0.0, "tp": 0, "fp": 4, "fn": 8, "parse_ok": true, "parse_error_kind": null, "schema_case_errors": 0, "failure_taxonomy": { "missed_repair": 6, "overrepair": 2, "wrong_value": 2 }, "target_rows": [ { "_row": "1394", "tuple_id": "1395", "src": "orbitz", "flight": "UA-858-PVG-SFO", "sched_dep_time": "1:45 p.m.", "act_dep_time": "1:32 p.m.", "sched_arr_time": "8:27aDec 1", "act_arr_time": "8:02aDec 1" }, { "_row": "1395", "tuple_id": "1396", "src": "orbitz", "flight": "UA-2704-DTW-PHX", "sched_dep_time": "11:15aDec 1", "act_dep_time": "11:15aDec 1", "sched_arr_time": "1:40 p.m.", "act_arr_time": "2:00 p.m." }, { "_row": "1396", "tuple_id": "1397", "src": "orbitz", "flight": "AA-3063-SLC-LAX", "sched_dep_time": "8:20 p.m.", "act_dep_time": "8:30 p.m.", "sched_arr_time": "9:18 p.m.", "act_arr_time": "" }, { "_row": "1397", "tuple_id": "1398", "src": "orbitz", "flight": "UA-2708-EWR-CLT", "sched_dep_time": "2:55 p.m.", "act_dep_time": "2:52 p.m.", "sched_arr_time": "4:53 p.m.", "act_arr_time": "4:44 p.m." } ], "ground_truth": [ { "row": 1394, "column": "sched_arr_time", "clean_value": "8:27 a.m." }, { "row": 1394, "column": "act_arr_time", "clean_value": "8:02 a.m." }, { "row": 1395, "column": "sched_dep_time", "clean_value": "11:15 a.m." }, { "row": 1395, "column": "act_dep_time", "clean_value": "11:15 a.m." }, { "row": 1396, "column": "act_dep_time", "clean_value": "8:39 p.m." }, { "row": 1396, "column": "sched_arr_time", "clean_value": "9:20 p.m." }, { "row": 1396, "column": "act_arr_time", "clean_value": "9:20 p.m." }, { "row": 1397, "column": "act_dep_time", "clean_value": "2:55 p.m." } ], "predicted_repairs": [ { "row": 1394, "column": "act_arr_time", "new_value": "8:02pDec 1", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1395, "column": "act_arr_time", "new_value": "2:00pDec 1", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1396, "column": "act_arr_time", "new_value": "8:30pDec 1", "reason": "The new value for act_arr_time is incorrect." }, { "row": 1397, "column": "act_arr_time", "new_value": "4:44pDec 1", "reason": "The new value for act_arr_time is incorrect." } ], "decoded_preview": "{\"action\":\"submit_repairs\",\"repairs\":[{\"row\":1394,\"column\":\"act_arr_time\",\"new_value\":\"8:02pDec 1\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1395,\"column\":\"act_arr_time\",\"new_value\":\"2:00pDec 1\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1396,\"column\":\"act_arr_time\",\"new_value\":\"8:30pDec 1\",\"reason\":\"The new value for act_arr_time is incorrect.\"},{\"row\":1397,\"column\":\"act_arr_time\",\"new_value\":\"4:44pDec 1\",\"reason\":\"The new value for act_arr_time is incorrect.\"}]}" } ] } } }