Upload MIMIC test evaluation results
Browse files
README.md
CHANGED
|
@@ -105,34 +105,34 @@ These comparison tables are refreshed across the full LAnA collection whenever a
|
|
| 105 |
| Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
|
| 106 |
| --- | --- | --- | --- | --- | --- |
|
| 107 |
| Number of studies | `3041` | `3041` | `3041` | `3041` | `3041` |
|
| 108 |
-
| ROUGE-L | `0.1686` | `0.1653` | `0.1513` | `0.1670` | `0.
|
| 109 |
-
| BLEU-1 | `0.2091` | `0.1916` | `0.1707` | `0.2174` | `0.
|
| 110 |
-
| BLEU-4 | `0.0417` | `0.0386` | `0.0357` | `0.0417` | `0.
|
| 111 |
-
| METEOR | `0.2298` | `0.2202` | `0.2079` | `0.2063` | `0.
|
| 112 |
-
| RadGraph F1 | `0.1024` | `0.0921` | `0.0918` | `0.1057` | `0.
|
| 113 |
-
| RadGraph entity F1 | `0.1587` | `0.1459` | `0.1399` | `0.1569` | `0.
|
| 114 |
-
| RadGraph relation F1 | `0.1443` | `0.1322` | `0.1246` | `0.1474` | `0.
|
| 115 |
-
| CheXpert F1 14-micro | `0.2116` | `0.1565` | `0.1829` | `0.1401` | `0.
|
| 116 |
-
| CheXpert F1 5-micro | `0.2512` | `0.1530` | `0.2183` | `0.2506` | `0.
|
| 117 |
-
| CheXpert F1 14-macro | `0.1095` | `0.0713` | `0.1095` | `0.0401` | `0.
|
| 118 |
-
| CheXpert F1 5-macro | `0.1644` | `0.1007` | `0.1634` | `0.1004` | `0.
|
| 119 |
|
| 120 |
### Cross-Model Comparison: Findings-Only Frontal Test Studies
|
| 121 |
|
| 122 |
| Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
|
| 123 |
| --- | --- | --- | --- | --- | --- |
|
| 124 |
| Number of studies | `2210` | `2210` | `2210` | `2210` | `2210` |
|
| 125 |
-
| ROUGE-L | `0.1771` | `0.1720` | `0.1576` | `0.1771` | `0.
|
| 126 |
-
| BLEU-1 | `0.2177` | `0.2003` | `0.1754` | `0.2263` | `0.
|
| 127 |
-
| BLEU-4 | `0.0484` | `0.0449` | `0.0405` | `0.0487` | `0.
|
| 128 |
-
| METEOR | `0.2466` | `0.2347` | `0.2207` | `0.2240` | `0.
|
| 129 |
-
| RadGraph F1 | `0.1119` | `0.1000` | `0.1010` | `0.1181` | `0.
|
| 130 |
-
| RadGraph entity F1 | `0.1713` | `0.1577` | `0.1517` | `0.1739` | `0.
|
| 131 |
-
| RadGraph relation F1 | `0.1549` | `0.1413` | `0.1347` | `0.1628` | `0.
|
| 132 |
-
| CheXpert F1 14-micro | `0.1907` | `0.1442` | `0.1651` | `0.1365` | `0.
|
| 133 |
-
| CheXpert F1 5-micro | `0.2415` | `0.1716` | `0.2152` | `0.2455` | `0.
|
| 134 |
-
| CheXpert F1 14-macro | `0.1039` | `0.0700` | `0.1047` | `0.0381` | `0.
|
| 135 |
-
| CheXpert F1 5-macro | `0.1578` | `0.1112` | `0.1611` | `0.0952` | `0.
|
| 136 |
|
| 137 |
## Data
|
| 138 |
|
|
|
|
| 105 |
| Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
|
| 106 |
| --- | --- | --- | --- | --- | --- |
|
| 107 |
| Number of studies | `3041` | `3041` | `3041` | `3041` | `3041` |
|
| 108 |
+
| ROUGE-L | `0.1686` | `0.1653` | `0.1513` | `0.1670` | `0.1745` |
|
| 109 |
+
| BLEU-1 | `0.2091` | `0.1916` | `0.1707` | `0.2174` | `0.2346` |
|
| 110 |
+
| BLEU-4 | `0.0417` | `0.0386` | `0.0357` | `0.0417` | `0.0484` |
|
| 111 |
+
| METEOR | `0.2298` | `0.2202` | `0.2079` | `0.2063` | `0.2129` |
|
| 112 |
+
| RadGraph F1 | `0.1024` | `0.0921` | `0.0918` | `0.1057` | `0.0939` |
|
| 113 |
+
| RadGraph entity F1 | `0.1587` | `0.1459` | `0.1399` | `0.1569` | `0.1441` |
|
| 114 |
+
| RadGraph relation F1 | `0.1443` | `0.1322` | `0.1246` | `0.1474` | `0.1280` |
|
| 115 |
+
| CheXpert F1 14-micro | `0.2116` | `0.1565` | `0.1829` | `0.1401` | `0.3116` |
|
| 116 |
+
| CheXpert F1 5-micro | `0.2512` | `0.1530` | `0.2183` | `0.2506` | `0.2486` |
|
| 117 |
+
| CheXpert F1 14-macro | `0.1095` | `0.0713` | `0.1095` | `0.0401` | `0.1363` |
|
| 118 |
+
| CheXpert F1 5-macro | `0.1644` | `0.1007` | `0.1634` | `0.1004` | `0.1686` |
|
| 119 |
|
| 120 |
### Cross-Model Comparison: Findings-Only Frontal Test Studies
|
| 121 |
|
| 122 |
| Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
|
| 123 |
| --- | --- | --- | --- | --- | --- |
|
| 124 |
| Number of studies | `2210` | `2210` | `2210` | `2210` | `2210` |
|
| 125 |
+
| ROUGE-L | `0.1771` | `0.1720` | `0.1576` | `0.1771` | `0.1848` |
|
| 126 |
+
| BLEU-1 | `0.2177` | `0.2003` | `0.1754` | `0.2263` | `0.2480` |
|
| 127 |
+
| BLEU-4 | `0.0484` | `0.0449` | `0.0405` | `0.0487` | `0.0573` |
|
| 128 |
+
| METEOR | `0.2466` | `0.2347` | `0.2207` | `0.2240` | `0.2310` |
|
| 129 |
+
| RadGraph F1 | `0.1119` | `0.1000` | `0.1010` | `0.1181` | `0.1046` |
|
| 130 |
+
| RadGraph entity F1 | `0.1713` | `0.1577` | `0.1517` | `0.1739` | `0.1584` |
|
| 131 |
+
| RadGraph relation F1 | `0.1549` | `0.1413` | `0.1347` | `0.1628` | `0.1405` |
|
| 132 |
+
| CheXpert F1 14-micro | `0.1907` | `0.1442` | `0.1651` | `0.1365` | `0.2921` |
|
| 133 |
+
| CheXpert F1 5-micro | `0.2415` | `0.1716` | `0.2152` | `0.2455` | `0.2394` |
|
| 134 |
+
| CheXpert F1 14-macro | `0.1039` | `0.0700` | `0.1047` | `0.0381` | `0.1326` |
|
| 135 |
+
| CheXpert F1 5-macro | `0.1578` | `0.1112` | `0.1611` | `0.0952` | `0.1636` |
|
| 136 |
|
| 137 |
## Data
|
| 138 |
|
evaluations/mimic_test_findings_only_metrics.json
CHANGED
|
@@ -4,35 +4,35 @@
|
|
| 4 |
"dataset": "mimic-cxr",
|
| 5 |
"view_filter": "frontal-only (PA/AP), structured Findings section only",
|
| 6 |
"num_examples": 2210,
|
| 7 |
-
"bleu_1": 0.
|
| 8 |
-
"bleu_4": 0.
|
| 9 |
-
"meteor": 0.
|
| 10 |
-
"rouge_l": 0.
|
| 11 |
-
"chexpert_f1_14_micro": 0.
|
| 12 |
-
"chexpert_f1_5_micro": 0.
|
| 13 |
-
"chexpert_f1_14_macro": 0.
|
| 14 |
-
"chexpert_f1_5_macro": 0.
|
| 15 |
-
"chexpert_f1_micro": 0.
|
| 16 |
-
"chexpert_f1_macro": 0.
|
| 17 |
"chexpert_per_label_f1": {
|
| 18 |
-
"Enlarged Cardiomediastinum": 0.
|
| 19 |
-
"Cardiomegaly": 0.
|
| 20 |
"Lung Opacity": 0.005772005772005772,
|
| 21 |
"Lung Lesion": 0.0,
|
| 22 |
-
"Edema": 0.
|
| 23 |
"Consolidation": 0.0,
|
| 24 |
"Pneumonia": 0.0,
|
| 25 |
"Atelectasis": 0.013186813186813187,
|
| 26 |
"Pneumothorax": 0.0,
|
| 27 |
-
"Pleural Effusion": 0.
|
| 28 |
"Pleural Other": 0.0,
|
| 29 |
-
"Fracture": 0.
|
| 30 |
-
"Support Devices": 0.
|
| 31 |
-
"No Finding": 0.
|
| 32 |
},
|
| 33 |
-
"radgraph_f1": 0.
|
| 34 |
-
"radgraph_f1_entity": 0.
|
| 35 |
-
"radgraph_f1_relation": 0.
|
| 36 |
"radgraph_available": true,
|
| 37 |
"radgraph_error": null
|
| 38 |
}
|
|
|
|
| 4 |
"dataset": "mimic-cxr",
|
| 5 |
"view_filter": "frontal-only (PA/AP), structured Findings section only",
|
| 6 |
"num_examples": 2210,
|
| 7 |
+
"bleu_1": 0.24804371044734913,
|
| 8 |
+
"bleu_4": 0.05730693271738745,
|
| 9 |
+
"meteor": 0.2309676565725014,
|
| 10 |
+
"rouge_l": 0.18476844395763578,
|
| 11 |
+
"chexpert_f1_14_micro": 0.2921437031188314,
|
| 12 |
+
"chexpert_f1_5_micro": 0.23939202026599113,
|
| 13 |
+
"chexpert_f1_14_macro": 0.13259269532627468,
|
| 14 |
+
"chexpert_f1_5_macro": 0.1635857001735776,
|
| 15 |
+
"chexpert_f1_micro": 0.2921437031188314,
|
| 16 |
+
"chexpert_f1_macro": 0.13259269532627468,
|
| 17 |
"chexpert_per_label_f1": {
|
| 18 |
+
"Enlarged Cardiomediastinum": 0.06293706293706294,
|
| 19 |
+
"Cardiomegaly": 0.3652312599681021,
|
| 20 |
"Lung Opacity": 0.005772005772005772,
|
| 21 |
"Lung Lesion": 0.0,
|
| 22 |
+
"Edema": 0.2601626016260163,
|
| 23 |
"Consolidation": 0.0,
|
| 24 |
"Pneumonia": 0.0,
|
| 25 |
"Atelectasis": 0.013186813186813187,
|
| 26 |
"Pneumothorax": 0.0,
|
| 27 |
+
"Pleural Effusion": 0.1793478260869565,
|
| 28 |
"Pleural Other": 0.0,
|
| 29 |
+
"Fracture": 0.023255813953488372,
|
| 30 |
+
"Support Devices": 0.5962264150943396,
|
| 31 |
+
"No Finding": 0.3501779359430605
|
| 32 |
},
|
| 33 |
+
"radgraph_f1": 0.10463721960424775,
|
| 34 |
+
"radgraph_f1_entity": 0.15836826410474694,
|
| 35 |
+
"radgraph_f1_relation": 0.1404934373559056,
|
| 36 |
"radgraph_available": true,
|
| 37 |
"radgraph_error": null
|
| 38 |
}
|
evaluations/mimic_test_findings_only_predictions.csv
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
evaluations/mimic_test_metrics.json
CHANGED
|
@@ -4,35 +4,35 @@
|
|
| 4 |
"dataset": "mimic-cxr",
|
| 5 |
"view_filter": "frontal-only (PA/AP)",
|
| 6 |
"num_examples": 3041,
|
| 7 |
-
"bleu_1": 0.
|
| 8 |
-
"bleu_4": 0.
|
| 9 |
-
"meteor": 0.
|
| 10 |
-
"rouge_l": 0.
|
| 11 |
-
"chexpert_f1_14_micro": 0.
|
| 12 |
-
"chexpert_f1_5_micro": 0.
|
| 13 |
-
"chexpert_f1_14_macro": 0.
|
| 14 |
-
"chexpert_f1_5_macro": 0.
|
| 15 |
-
"chexpert_f1_micro": 0.
|
| 16 |
-
"chexpert_f1_macro": 0.
|
| 17 |
"chexpert_per_label_f1": {
|
| 18 |
-
"Enlarged Cardiomediastinum": 0.
|
| 19 |
-
"Cardiomegaly": 0.
|
| 20 |
"Lung Opacity": 0.004073319755600814,
|
| 21 |
"Lung Lesion": 0.0,
|
| 22 |
-
"Edema": 0.
|
| 23 |
"Consolidation": 0.0,
|
| 24 |
"Pneumonia": 0.0,
|
| 25 |
"Atelectasis": 0.008695652173913044,
|
| 26 |
"Pneumothorax": 0.0,
|
| 27 |
-
"Pleural Effusion": 0.
|
| 28 |
"Pleural Other": 0.0,
|
| 29 |
-
"Fracture": 0.
|
| 30 |
-
"Support Devices": 0.
|
| 31 |
-
"No Finding": 0.
|
| 32 |
},
|
| 33 |
-
"radgraph_f1": 0.
|
| 34 |
-
"radgraph_f1_entity": 0.
|
| 35 |
-
"radgraph_f1_relation": 0.
|
| 36 |
"radgraph_available": true,
|
| 37 |
"radgraph_error": null,
|
| 38 |
"evaluation_suite": "mimic_test_dual",
|
|
@@ -42,35 +42,35 @@
|
|
| 42 |
"dataset": "mimic-cxr",
|
| 43 |
"view_filter": "frontal-only (PA/AP)",
|
| 44 |
"num_examples": 3041,
|
| 45 |
-
"bleu_1": 0.
|
| 46 |
-
"bleu_4": 0.
|
| 47 |
-
"meteor": 0.
|
| 48 |
-
"rouge_l": 0.
|
| 49 |
-
"chexpert_f1_14_micro": 0.
|
| 50 |
-
"chexpert_f1_5_micro": 0.
|
| 51 |
-
"chexpert_f1_14_macro": 0.
|
| 52 |
-
"chexpert_f1_5_macro": 0.
|
| 53 |
-
"chexpert_f1_micro": 0.
|
| 54 |
-
"chexpert_f1_macro": 0.
|
| 55 |
"chexpert_per_label_f1": {
|
| 56 |
-
"Enlarged Cardiomediastinum": 0.
|
| 57 |
-
"Cardiomegaly": 0.
|
| 58 |
"Lung Opacity": 0.004073319755600814,
|
| 59 |
"Lung Lesion": 0.0,
|
| 60 |
-
"Edema": 0.
|
| 61 |
"Consolidation": 0.0,
|
| 62 |
"Pneumonia": 0.0,
|
| 63 |
"Atelectasis": 0.008695652173913044,
|
| 64 |
"Pneumothorax": 0.0,
|
| 65 |
-
"Pleural Effusion": 0.
|
| 66 |
"Pleural Other": 0.0,
|
| 67 |
-
"Fracture": 0.
|
| 68 |
-
"Support Devices": 0.
|
| 69 |
-
"No Finding": 0.
|
| 70 |
},
|
| 71 |
-
"radgraph_f1": 0.
|
| 72 |
-
"radgraph_f1_entity": 0.
|
| 73 |
-
"radgraph_f1_relation": 0.
|
| 74 |
"radgraph_available": true,
|
| 75 |
"radgraph_error": null
|
| 76 |
},
|
|
@@ -80,35 +80,35 @@
|
|
| 80 |
"dataset": "mimic-cxr",
|
| 81 |
"view_filter": "frontal-only (PA/AP), structured Findings section only",
|
| 82 |
"num_examples": 2210,
|
| 83 |
-
"bleu_1": 0.
|
| 84 |
-
"bleu_4": 0.
|
| 85 |
-
"meteor": 0.
|
| 86 |
-
"rouge_l": 0.
|
| 87 |
-
"chexpert_f1_14_micro": 0.
|
| 88 |
-
"chexpert_f1_5_micro": 0.
|
| 89 |
-
"chexpert_f1_14_macro": 0.
|
| 90 |
-
"chexpert_f1_5_macro": 0.
|
| 91 |
-
"chexpert_f1_micro": 0.
|
| 92 |
-
"chexpert_f1_macro": 0.
|
| 93 |
"chexpert_per_label_f1": {
|
| 94 |
-
"Enlarged Cardiomediastinum": 0.
|
| 95 |
-
"Cardiomegaly": 0.
|
| 96 |
"Lung Opacity": 0.005772005772005772,
|
| 97 |
"Lung Lesion": 0.0,
|
| 98 |
-
"Edema": 0.
|
| 99 |
"Consolidation": 0.0,
|
| 100 |
"Pneumonia": 0.0,
|
| 101 |
"Atelectasis": 0.013186813186813187,
|
| 102 |
"Pneumothorax": 0.0,
|
| 103 |
-
"Pleural Effusion": 0.
|
| 104 |
"Pleural Other": 0.0,
|
| 105 |
-
"Fracture": 0.
|
| 106 |
-
"Support Devices": 0.
|
| 107 |
-
"No Finding": 0.
|
| 108 |
},
|
| 109 |
-
"radgraph_f1": 0.
|
| 110 |
-
"radgraph_f1_entity": 0.
|
| 111 |
-
"radgraph_f1_relation": 0.
|
| 112 |
"radgraph_available": true,
|
| 113 |
"radgraph_error": null
|
| 114 |
}
|
|
|
|
| 4 |
"dataset": "mimic-cxr",
|
| 5 |
"view_filter": "frontal-only (PA/AP)",
|
| 6 |
"num_examples": 3041,
|
| 7 |
+
"bleu_1": 0.23460907118482577,
|
| 8 |
+
"bleu_4": 0.0483690414206241,
|
| 9 |
+
"meteor": 0.21291121731396784,
|
| 10 |
+
"rouge_l": 0.17453617861562737,
|
| 11 |
+
"chexpert_f1_14_micro": 0.31163845751177804,
|
| 12 |
+
"chexpert_f1_5_micro": 0.24861538461538463,
|
| 13 |
+
"chexpert_f1_14_macro": 0.13629250906293128,
|
| 14 |
+
"chexpert_f1_5_macro": 0.16862522291180843,
|
| 15 |
+
"chexpert_f1_micro": 0.31163845751177804,
|
| 16 |
+
"chexpert_f1_macro": 0.13629250906293128,
|
| 17 |
"chexpert_per_label_f1": {
|
| 18 |
+
"Enlarged Cardiomediastinum": 0.07407407407407407,
|
| 19 |
+
"Cardiomegaly": 0.39663335086796425,
|
| 20 |
"Lung Opacity": 0.004073319755600814,
|
| 21 |
"Lung Lesion": 0.0,
|
| 22 |
+
"Edema": 0.2462526766595289,
|
| 23 |
"Consolidation": 0.0,
|
| 24 |
"Pneumonia": 0.0,
|
| 25 |
"Atelectasis": 0.008695652173913044,
|
| 26 |
"Pneumothorax": 0.0,
|
| 27 |
+
"Pleural Effusion": 0.1915444348576359,
|
| 28 |
"Pleural Other": 0.0,
|
| 29 |
+
"Fracture": 0.017543859649122806,
|
| 30 |
+
"Support Devices": 0.6656580937972768,
|
| 31 |
+
"No Finding": 0.30361966504592114
|
| 32 |
},
|
| 33 |
+
"radgraph_f1": 0.0938551356876054,
|
| 34 |
+
"radgraph_f1_entity": 0.14413244058497404,
|
| 35 |
+
"radgraph_f1_relation": 0.12803672953985817,
|
| 36 |
"radgraph_available": true,
|
| 37 |
"radgraph_error": null,
|
| 38 |
"evaluation_suite": "mimic_test_dual",
|
|
|
|
| 42 |
"dataset": "mimic-cxr",
|
| 43 |
"view_filter": "frontal-only (PA/AP)",
|
| 44 |
"num_examples": 3041,
|
| 45 |
+
"bleu_1": 0.23460907118482577,
|
| 46 |
+
"bleu_4": 0.0483690414206241,
|
| 47 |
+
"meteor": 0.21291121731396784,
|
| 48 |
+
"rouge_l": 0.17453617861562737,
|
| 49 |
+
"chexpert_f1_14_micro": 0.31163845751177804,
|
| 50 |
+
"chexpert_f1_5_micro": 0.24861538461538463,
|
| 51 |
+
"chexpert_f1_14_macro": 0.13629250906293128,
|
| 52 |
+
"chexpert_f1_5_macro": 0.16862522291180843,
|
| 53 |
+
"chexpert_f1_micro": 0.31163845751177804,
|
| 54 |
+
"chexpert_f1_macro": 0.13629250906293128,
|
| 55 |
"chexpert_per_label_f1": {
|
| 56 |
+
"Enlarged Cardiomediastinum": 0.07407407407407407,
|
| 57 |
+
"Cardiomegaly": 0.39663335086796425,
|
| 58 |
"Lung Opacity": 0.004073319755600814,
|
| 59 |
"Lung Lesion": 0.0,
|
| 60 |
+
"Edema": 0.2462526766595289,
|
| 61 |
"Consolidation": 0.0,
|
| 62 |
"Pneumonia": 0.0,
|
| 63 |
"Atelectasis": 0.008695652173913044,
|
| 64 |
"Pneumothorax": 0.0,
|
| 65 |
+
"Pleural Effusion": 0.1915444348576359,
|
| 66 |
"Pleural Other": 0.0,
|
| 67 |
+
"Fracture": 0.017543859649122806,
|
| 68 |
+
"Support Devices": 0.6656580937972768,
|
| 69 |
+
"No Finding": 0.30361966504592114
|
| 70 |
},
|
| 71 |
+
"radgraph_f1": 0.0938551356876054,
|
| 72 |
+
"radgraph_f1_entity": 0.14413244058497404,
|
| 73 |
+
"radgraph_f1_relation": 0.12803672953985817,
|
| 74 |
"radgraph_available": true,
|
| 75 |
"radgraph_error": null
|
| 76 |
},
|
|
|
|
| 80 |
"dataset": "mimic-cxr",
|
| 81 |
"view_filter": "frontal-only (PA/AP), structured Findings section only",
|
| 82 |
"num_examples": 2210,
|
| 83 |
+
"bleu_1": 0.24804371044734913,
|
| 84 |
+
"bleu_4": 0.05730693271738745,
|
| 85 |
+
"meteor": 0.2309676565725014,
|
| 86 |
+
"rouge_l": 0.18476844395763578,
|
| 87 |
+
"chexpert_f1_14_micro": 0.2921437031188314,
|
| 88 |
+
"chexpert_f1_5_micro": 0.23939202026599113,
|
| 89 |
+
"chexpert_f1_14_macro": 0.13259269532627468,
|
| 90 |
+
"chexpert_f1_5_macro": 0.1635857001735776,
|
| 91 |
+
"chexpert_f1_micro": 0.2921437031188314,
|
| 92 |
+
"chexpert_f1_macro": 0.13259269532627468,
|
| 93 |
"chexpert_per_label_f1": {
|
| 94 |
+
"Enlarged Cardiomediastinum": 0.06293706293706294,
|
| 95 |
+
"Cardiomegaly": 0.3652312599681021,
|
| 96 |
"Lung Opacity": 0.005772005772005772,
|
| 97 |
"Lung Lesion": 0.0,
|
| 98 |
+
"Edema": 0.2601626016260163,
|
| 99 |
"Consolidation": 0.0,
|
| 100 |
"Pneumonia": 0.0,
|
| 101 |
"Atelectasis": 0.013186813186813187,
|
| 102 |
"Pneumothorax": 0.0,
|
| 103 |
+
"Pleural Effusion": 0.1793478260869565,
|
| 104 |
"Pleural Other": 0.0,
|
| 105 |
+
"Fracture": 0.023255813953488372,
|
| 106 |
+
"Support Devices": 0.5962264150943396,
|
| 107 |
+
"No Finding": 0.3501779359430605
|
| 108 |
},
|
| 109 |
+
"radgraph_f1": 0.10463721960424775,
|
| 110 |
+
"radgraph_f1_entity": 0.15836826410474694,
|
| 111 |
+
"radgraph_f1_relation": 0.1404934373559056,
|
| 112 |
"radgraph_available": true,
|
| 113 |
"radgraph_error": null
|
| 114 |
}
|
evaluations/mimic_test_predictions.csv
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
run_summary.json
CHANGED
|
@@ -50,35 +50,35 @@
|
|
| 50 |
"dataset": "mimic-cxr",
|
| 51 |
"view_filter": "frontal-only (PA/AP)",
|
| 52 |
"num_examples": 3041,
|
| 53 |
-
"bleu_1": 0.
|
| 54 |
-
"bleu_4": 0.
|
| 55 |
-
"meteor": 0.
|
| 56 |
-
"rouge_l": 0.
|
| 57 |
-
"chexpert_f1_14_micro": 0.
|
| 58 |
-
"chexpert_f1_5_micro": 0.
|
| 59 |
-
"chexpert_f1_14_macro": 0.
|
| 60 |
-
"chexpert_f1_5_macro": 0.
|
| 61 |
-
"chexpert_f1_micro": 0.
|
| 62 |
-
"chexpert_f1_macro": 0.
|
| 63 |
"chexpert_per_label_f1": {
|
| 64 |
-
"Enlarged Cardiomediastinum": 0.
|
| 65 |
-
"Cardiomegaly": 0.
|
| 66 |
"Lung Opacity": 0.004073319755600814,
|
| 67 |
"Lung Lesion": 0.0,
|
| 68 |
-
"Edema": 0.
|
| 69 |
"Consolidation": 0.0,
|
| 70 |
"Pneumonia": 0.0,
|
| 71 |
"Atelectasis": 0.008695652173913044,
|
| 72 |
"Pneumothorax": 0.0,
|
| 73 |
-
"Pleural Effusion": 0.
|
| 74 |
"Pleural Other": 0.0,
|
| 75 |
-
"Fracture": 0.
|
| 76 |
-
"Support Devices": 0.
|
| 77 |
-
"No Finding": 0.
|
| 78 |
},
|
| 79 |
-
"radgraph_f1": 0.
|
| 80 |
-
"radgraph_f1_entity": 0.
|
| 81 |
-
"radgraph_f1_relation": 0.
|
| 82 |
"radgraph_available": true,
|
| 83 |
"radgraph_error": null
|
| 84 |
},
|
|
@@ -89,35 +89,35 @@
|
|
| 89 |
"dataset": "mimic-cxr",
|
| 90 |
"view_filter": "frontal-only (PA/AP)",
|
| 91 |
"num_examples": 3041,
|
| 92 |
-
"bleu_1": 0.
|
| 93 |
-
"bleu_4": 0.
|
| 94 |
-
"meteor": 0.
|
| 95 |
-
"rouge_l": 0.
|
| 96 |
-
"chexpert_f1_14_micro": 0.
|
| 97 |
-
"chexpert_f1_5_micro": 0.
|
| 98 |
-
"chexpert_f1_14_macro": 0.
|
| 99 |
-
"chexpert_f1_5_macro": 0.
|
| 100 |
-
"chexpert_f1_micro": 0.
|
| 101 |
-
"chexpert_f1_macro": 0.
|
| 102 |
"chexpert_per_label_f1": {
|
| 103 |
-
"Enlarged Cardiomediastinum": 0.
|
| 104 |
-
"Cardiomegaly": 0.
|
| 105 |
"Lung Opacity": 0.004073319755600814,
|
| 106 |
"Lung Lesion": 0.0,
|
| 107 |
-
"Edema": 0.
|
| 108 |
"Consolidation": 0.0,
|
| 109 |
"Pneumonia": 0.0,
|
| 110 |
"Atelectasis": 0.008695652173913044,
|
| 111 |
"Pneumothorax": 0.0,
|
| 112 |
-
"Pleural Effusion": 0.
|
| 113 |
"Pleural Other": 0.0,
|
| 114 |
-
"Fracture": 0.
|
| 115 |
-
"Support Devices": 0.
|
| 116 |
-
"No Finding": 0.
|
| 117 |
},
|
| 118 |
-
"radgraph_f1": 0.
|
| 119 |
-
"radgraph_f1_entity": 0.
|
| 120 |
-
"radgraph_f1_relation": 0.
|
| 121 |
"radgraph_available": true,
|
| 122 |
"radgraph_error": null
|
| 123 |
},
|
|
@@ -127,35 +127,35 @@
|
|
| 127 |
"dataset": "mimic-cxr",
|
| 128 |
"view_filter": "frontal-only (PA/AP), structured Findings section only",
|
| 129 |
"num_examples": 2210,
|
| 130 |
-
"bleu_1": 0.
|
| 131 |
-
"bleu_4": 0.
|
| 132 |
-
"meteor": 0.
|
| 133 |
-
"rouge_l": 0.
|
| 134 |
-
"chexpert_f1_14_micro": 0.
|
| 135 |
-
"chexpert_f1_5_micro": 0.
|
| 136 |
-
"chexpert_f1_14_macro": 0.
|
| 137 |
-
"chexpert_f1_5_macro": 0.
|
| 138 |
-
"chexpert_f1_micro": 0.
|
| 139 |
-
"chexpert_f1_macro": 0.
|
| 140 |
"chexpert_per_label_f1": {
|
| 141 |
-
"Enlarged Cardiomediastinum": 0.
|
| 142 |
-
"Cardiomegaly": 0.
|
| 143 |
"Lung Opacity": 0.005772005772005772,
|
| 144 |
"Lung Lesion": 0.0,
|
| 145 |
-
"Edema": 0.
|
| 146 |
"Consolidation": 0.0,
|
| 147 |
"Pneumonia": 0.0,
|
| 148 |
"Atelectasis": 0.013186813186813187,
|
| 149 |
"Pneumothorax": 0.0,
|
| 150 |
-
"Pleural Effusion": 0.
|
| 151 |
"Pleural Other": 0.0,
|
| 152 |
-
"Fracture": 0.
|
| 153 |
-
"Support Devices": 0.
|
| 154 |
-
"No Finding": 0.
|
| 155 |
},
|
| 156 |
-
"radgraph_f1": 0.
|
| 157 |
-
"radgraph_f1_entity": 0.
|
| 158 |
-
"radgraph_f1_relation": 0.
|
| 159 |
"radgraph_available": true,
|
| 160 |
"radgraph_error": null
|
| 161 |
}
|
|
|
|
| 50 |
"dataset": "mimic-cxr",
|
| 51 |
"view_filter": "frontal-only (PA/AP)",
|
| 52 |
"num_examples": 3041,
|
| 53 |
+
"bleu_1": 0.23460907118482577,
|
| 54 |
+
"bleu_4": 0.0483690414206241,
|
| 55 |
+
"meteor": 0.21291121731396784,
|
| 56 |
+
"rouge_l": 0.17453617861562737,
|
| 57 |
+
"chexpert_f1_14_micro": 0.31163845751177804,
|
| 58 |
+
"chexpert_f1_5_micro": 0.24861538461538463,
|
| 59 |
+
"chexpert_f1_14_macro": 0.13629250906293128,
|
| 60 |
+
"chexpert_f1_5_macro": 0.16862522291180843,
|
| 61 |
+
"chexpert_f1_micro": 0.31163845751177804,
|
| 62 |
+
"chexpert_f1_macro": 0.13629250906293128,
|
| 63 |
"chexpert_per_label_f1": {
|
| 64 |
+
"Enlarged Cardiomediastinum": 0.07407407407407407,
|
| 65 |
+
"Cardiomegaly": 0.39663335086796425,
|
| 66 |
"Lung Opacity": 0.004073319755600814,
|
| 67 |
"Lung Lesion": 0.0,
|
| 68 |
+
"Edema": 0.2462526766595289,
|
| 69 |
"Consolidation": 0.0,
|
| 70 |
"Pneumonia": 0.0,
|
| 71 |
"Atelectasis": 0.008695652173913044,
|
| 72 |
"Pneumothorax": 0.0,
|
| 73 |
+
"Pleural Effusion": 0.1915444348576359,
|
| 74 |
"Pleural Other": 0.0,
|
| 75 |
+
"Fracture": 0.017543859649122806,
|
| 76 |
+
"Support Devices": 0.6656580937972768,
|
| 77 |
+
"No Finding": 0.30361966504592114
|
| 78 |
},
|
| 79 |
+
"radgraph_f1": 0.0938551356876054,
|
| 80 |
+
"radgraph_f1_entity": 0.14413244058497404,
|
| 81 |
+
"radgraph_f1_relation": 0.12803672953985817,
|
| 82 |
"radgraph_available": true,
|
| 83 |
"radgraph_error": null
|
| 84 |
},
|
|
|
|
| 89 |
"dataset": "mimic-cxr",
|
| 90 |
"view_filter": "frontal-only (PA/AP)",
|
| 91 |
"num_examples": 3041,
|
| 92 |
+
"bleu_1": 0.23460907118482577,
|
| 93 |
+
"bleu_4": 0.0483690414206241,
|
| 94 |
+
"meteor": 0.21291121731396784,
|
| 95 |
+
"rouge_l": 0.17453617861562737,
|
| 96 |
+
"chexpert_f1_14_micro": 0.31163845751177804,
|
| 97 |
+
"chexpert_f1_5_micro": 0.24861538461538463,
|
| 98 |
+
"chexpert_f1_14_macro": 0.13629250906293128,
|
| 99 |
+
"chexpert_f1_5_macro": 0.16862522291180843,
|
| 100 |
+
"chexpert_f1_micro": 0.31163845751177804,
|
| 101 |
+
"chexpert_f1_macro": 0.13629250906293128,
|
| 102 |
"chexpert_per_label_f1": {
|
| 103 |
+
"Enlarged Cardiomediastinum": 0.07407407407407407,
|
| 104 |
+
"Cardiomegaly": 0.39663335086796425,
|
| 105 |
"Lung Opacity": 0.004073319755600814,
|
| 106 |
"Lung Lesion": 0.0,
|
| 107 |
+
"Edema": 0.2462526766595289,
|
| 108 |
"Consolidation": 0.0,
|
| 109 |
"Pneumonia": 0.0,
|
| 110 |
"Atelectasis": 0.008695652173913044,
|
| 111 |
"Pneumothorax": 0.0,
|
| 112 |
+
"Pleural Effusion": 0.1915444348576359,
|
| 113 |
"Pleural Other": 0.0,
|
| 114 |
+
"Fracture": 0.017543859649122806,
|
| 115 |
+
"Support Devices": 0.6656580937972768,
|
| 116 |
+
"No Finding": 0.30361966504592114
|
| 117 |
},
|
| 118 |
+
"radgraph_f1": 0.0938551356876054,
|
| 119 |
+
"radgraph_f1_entity": 0.14413244058497404,
|
| 120 |
+
"radgraph_f1_relation": 0.12803672953985817,
|
| 121 |
"radgraph_available": true,
|
| 122 |
"radgraph_error": null
|
| 123 |
},
|
|
|
|
| 127 |
"dataset": "mimic-cxr",
|
| 128 |
"view_filter": "frontal-only (PA/AP), structured Findings section only",
|
| 129 |
"num_examples": 2210,
|
| 130 |
+
"bleu_1": 0.24804371044734913,
|
| 131 |
+
"bleu_4": 0.05730693271738745,
|
| 132 |
+
"meteor": 0.2309676565725014,
|
| 133 |
+
"rouge_l": 0.18476844395763578,
|
| 134 |
+
"chexpert_f1_14_micro": 0.2921437031188314,
|
| 135 |
+
"chexpert_f1_5_micro": 0.23939202026599113,
|
| 136 |
+
"chexpert_f1_14_macro": 0.13259269532627468,
|
| 137 |
+
"chexpert_f1_5_macro": 0.1635857001735776,
|
| 138 |
+
"chexpert_f1_micro": 0.2921437031188314,
|
| 139 |
+
"chexpert_f1_macro": 0.13259269532627468,
|
| 140 |
"chexpert_per_label_f1": {
|
| 141 |
+
"Enlarged Cardiomediastinum": 0.06293706293706294,
|
| 142 |
+
"Cardiomegaly": 0.3652312599681021,
|
| 143 |
"Lung Opacity": 0.005772005772005772,
|
| 144 |
"Lung Lesion": 0.0,
|
| 145 |
+
"Edema": 0.2601626016260163,
|
| 146 |
"Consolidation": 0.0,
|
| 147 |
"Pneumonia": 0.0,
|
| 148 |
"Atelectasis": 0.013186813186813187,
|
| 149 |
"Pneumothorax": 0.0,
|
| 150 |
+
"Pleural Effusion": 0.1793478260869565,
|
| 151 |
"Pleural Other": 0.0,
|
| 152 |
+
"Fracture": 0.023255813953488372,
|
| 153 |
+
"Support Devices": 0.5962264150943396,
|
| 154 |
+
"No Finding": 0.3501779359430605
|
| 155 |
},
|
| 156 |
+
"radgraph_f1": 0.10463721960424775,
|
| 157 |
+
"radgraph_f1_entity": 0.15836826410474694,
|
| 158 |
+
"radgraph_f1_relation": 0.1404934373559056,
|
| 159 |
"radgraph_available": true,
|
| 160 |
"radgraph_error": null
|
| 161 |
}
|