manu02 committed on
Commit
8df95e5
·
verified ·
1 Parent(s): f1b8811

Upload MIMIC test evaluation results

Browse files
README.md CHANGED
@@ -105,34 +105,34 @@ These comparison tables are refreshed across the full LAnA collection whenever a
105
  | Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
106
  | --- | --- | --- | --- | --- | --- |
107
  | Number of studies | `3041` | `3041` | `3041` | `3041` | `3041` |
108
- | ROUGE-L | `0.1686` | `0.1653` | `0.1513` | `0.1670` | `0.1526` |
109
- | BLEU-1 | `0.2091` | `0.1916` | `0.1707` | `0.2174` | `0.1650` |
110
- | BLEU-4 | `0.0417` | `0.0386` | `0.0357` | `0.0417` | `0.0334` |
111
- | METEOR | `0.2298` | `0.2202` | `0.2079` | `0.2063` | `0.2057` |
112
- | RadGraph F1 | `0.1024` | `0.0921` | `0.0918` | `0.1057` | `0.0941` |
113
- | RadGraph entity F1 | `0.1587` | `0.1459` | `0.1399` | `0.1569` | `0.1454` |
114
- | RadGraph relation F1 | `0.1443` | `0.1322` | `0.1246` | `0.1474` | `0.1296` |
115
- | CheXpert F1 14-micro | `0.2116` | `0.1565` | `0.1829` | `0.1401` | `0.2607` |
116
- | CheXpert F1 5-micro | `0.2512` | `0.1530` | `0.2183` | `0.2506` | `0.2470` |
117
- | CheXpert F1 14-macro | `0.1095` | `0.0713` | `0.1095` | `0.0401` | `0.1240` |
118
- | CheXpert F1 5-macro | `0.1644` | `0.1007` | `0.1634` | `0.1004` | `0.1682` |
119
 
120
  ### Cross-Model Comparison: Findings-Only Frontal Test Studies
121
 
122
  | Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
123
  | --- | --- | --- | --- | --- | --- |
124
  | Number of studies | `2210` | `2210` | `2210` | `2210` | `2210` |
125
- | ROUGE-L | `0.1771` | `0.1720` | `0.1576` | `0.1771` | `0.1613` |
126
- | BLEU-1 | `0.2177` | `0.2003` | `0.1754` | `0.2263` | `0.1749` |
127
- | BLEU-4 | `0.0484` | `0.0449` | `0.0405` | `0.0487` | `0.0397` |
128
- | METEOR | `0.2466` | `0.2347` | `0.2207` | `0.2240` | `0.2231` |
129
- | RadGraph F1 | `0.1119` | `0.1000` | `0.1010` | `0.1181` | `0.1047` |
130
- | RadGraph entity F1 | `0.1713` | `0.1577` | `0.1517` | `0.1739` | `0.1595` |
131
- | RadGraph relation F1 | `0.1549` | `0.1413` | `0.1347` | `0.1628` | `0.1419` |
132
- | CheXpert F1 14-micro | `0.1907` | `0.1442` | `0.1651` | `0.1365` | `0.2501` |
133
- | CheXpert F1 5-micro | `0.2415` | `0.1716` | `0.2152` | `0.2455` | `0.2375` |
134
- | CheXpert F1 14-macro | `0.1039` | `0.0700` | `0.1047` | `0.0381` | `0.1203` |
135
- | CheXpert F1 5-macro | `0.1578` | `0.1112` | `0.1611` | `0.0952` | `0.1627` |
136
 
137
  ## Data
138
 
 
105
  | Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
106
  | --- | --- | --- | --- | --- | --- |
107
  | Number of studies | `3041` | `3041` | `3041` | `3041` | `3041` |
108
+ | ROUGE-L | `0.1686` | `0.1653` | `0.1513` | `0.1670` | `0.1745` |
109
+ | BLEU-1 | `0.2091` | `0.1916` | `0.1707` | `0.2174` | `0.2346` |
110
+ | BLEU-4 | `0.0417` | `0.0386` | `0.0357` | `0.0417` | `0.0484` |
111
+ | METEOR | `0.2298` | `0.2202` | `0.2079` | `0.2063` | `0.2129` |
112
+ | RadGraph F1 | `0.1024` | `0.0921` | `0.0918` | `0.1057` | `0.0939` |
113
+ | RadGraph entity F1 | `0.1587` | `0.1459` | `0.1399` | `0.1569` | `0.1441` |
114
+ | RadGraph relation F1 | `0.1443` | `0.1322` | `0.1246` | `0.1474` | `0.1280` |
115
+ | CheXpert F1 14-micro | `0.2116` | `0.1565` | `0.1829` | `0.1401` | `0.3116` |
116
+ | CheXpert F1 5-micro | `0.2512` | `0.1530` | `0.2183` | `0.2506` | `0.2486` |
117
+ | CheXpert F1 14-macro | `0.1095` | `0.0713` | `0.1095` | `0.0401` | `0.1363` |
118
+ | CheXpert F1 5-macro | `0.1644` | `0.1007` | `0.1634` | `0.1004` | `0.1686` |
119
 
120
  ### Cross-Model Comparison: Findings-Only Frontal Test Studies
121
 
122
  | Metric | LAnA | LAnA-MIMIC | LAnA-MIMIC-CHEXPERT | LAnA-v2 | LAnA-v3 |
123
  | --- | --- | --- | --- | --- | --- |
124
  | Number of studies | `2210` | `2210` | `2210` | `2210` | `2210` |
125
+ | ROUGE-L | `0.1771` | `0.1720` | `0.1576` | `0.1771` | `0.1848` |
126
+ | BLEU-1 | `0.2177` | `0.2003` | `0.1754` | `0.2263` | `0.2480` |
127
+ | BLEU-4 | `0.0484` | `0.0449` | `0.0405` | `0.0487` | `0.0573` |
128
+ | METEOR | `0.2466` | `0.2347` | `0.2207` | `0.2240` | `0.2310` |
129
+ | RadGraph F1 | `0.1119` | `0.1000` | `0.1010` | `0.1181` | `0.1046` |
130
+ | RadGraph entity F1 | `0.1713` | `0.1577` | `0.1517` | `0.1739` | `0.1584` |
131
+ | RadGraph relation F1 | `0.1549` | `0.1413` | `0.1347` | `0.1628` | `0.1405` |
132
+ | CheXpert F1 14-micro | `0.1907` | `0.1442` | `0.1651` | `0.1365` | `0.2921` |
133
+ | CheXpert F1 5-micro | `0.2415` | `0.1716` | `0.2152` | `0.2455` | `0.2394` |
134
+ | CheXpert F1 14-macro | `0.1039` | `0.0700` | `0.1047` | `0.0381` | `0.1326` |
135
+ | CheXpert F1 5-macro | `0.1578` | `0.1112` | `0.1611` | `0.0952` | `0.1636` |
136
 
137
  ## Data
138
 
evaluations/mimic_test_findings_only_metrics.json CHANGED
@@ -4,35 +4,35 @@
4
  "dataset": "mimic-cxr",
5
  "view_filter": "frontal-only (PA/AP), structured Findings section only",
6
  "num_examples": 2210,
7
- "bleu_1": 0.17491187190057955,
8
- "bleu_4": 0.03966117310602323,
9
- "meteor": 0.22311507091428398,
10
- "rouge_l": 0.1612770175038926,
11
- "chexpert_f1_14_micro": 0.2501020547013199,
12
- "chexpert_f1_5_micro": 0.23749208359721344,
13
- "chexpert_f1_14_macro": 0.12030236160434729,
14
- "chexpert_f1_5_macro": 0.16269249240448827,
15
- "chexpert_f1_micro": 0.2501020547013199,
16
- "chexpert_f1_macro": 0.12030236160434729,
17
  "chexpert_per_label_f1": {
18
- "Enlarged Cardiomediastinum": 0.0625,
19
- "Cardiomegaly": 0.3613109512390088,
20
  "Lung Opacity": 0.005772005772005772,
21
  "Lung Lesion": 0.0,
22
- "Edema": 0.26058631921824105,
23
  "Consolidation": 0.0,
24
  "Pneumonia": 0.0,
25
  "Atelectasis": 0.013186813186813187,
26
  "Pneumothorax": 0.0,
27
- "Pleural Effusion": 0.1783783783783784,
28
  "Pleural Other": 0.0,
29
- "Fracture": 0.022988505747126436,
30
- "Support Devices": 0.415625,
31
- "No Finding": 0.36388508891928867
32
  },
33
- "radgraph_f1": 0.10468134329680011,
34
- "radgraph_f1_entity": 0.1595464585348944,
35
- "radgraph_f1_relation": 0.14191739966668873,
36
  "radgraph_available": true,
37
  "radgraph_error": null
38
  }
 
4
  "dataset": "mimic-cxr",
5
  "view_filter": "frontal-only (PA/AP), structured Findings section only",
6
  "num_examples": 2210,
7
+ "bleu_1": 0.24804371044734913,
8
+ "bleu_4": 0.05730693271738745,
9
+ "meteor": 0.2309676565725014,
10
+ "rouge_l": 0.18476844395763578,
11
+ "chexpert_f1_14_micro": 0.2921437031188314,
12
+ "chexpert_f1_5_micro": 0.23939202026599113,
13
+ "chexpert_f1_14_macro": 0.13259269532627468,
14
+ "chexpert_f1_5_macro": 0.1635857001735776,
15
+ "chexpert_f1_micro": 0.2921437031188314,
16
+ "chexpert_f1_macro": 0.13259269532627468,
17
  "chexpert_per_label_f1": {
18
+ "Enlarged Cardiomediastinum": 0.06293706293706294,
19
+ "Cardiomegaly": 0.3652312599681021,
20
  "Lung Opacity": 0.005772005772005772,
21
  "Lung Lesion": 0.0,
22
+ "Edema": 0.2601626016260163,
23
  "Consolidation": 0.0,
24
  "Pneumonia": 0.0,
25
  "Atelectasis": 0.013186813186813187,
26
  "Pneumothorax": 0.0,
27
+ "Pleural Effusion": 0.1793478260869565,
28
  "Pleural Other": 0.0,
29
+ "Fracture": 0.023255813953488372,
30
+ "Support Devices": 0.5962264150943396,
31
+ "No Finding": 0.3501779359430605
32
  },
33
+ "radgraph_f1": 0.10463721960424775,
34
+ "radgraph_f1_entity": 0.15836826410474694,
35
+ "radgraph_f1_relation": 0.1404934373559056,
36
  "radgraph_available": true,
37
  "radgraph_error": null
38
  }
evaluations/mimic_test_findings_only_predictions.csv CHANGED
The diff for this file is too large to render. See raw diff
 
evaluations/mimic_test_metrics.json CHANGED
@@ -4,35 +4,35 @@
4
  "dataset": "mimic-cxr",
5
  "view_filter": "frontal-only (PA/AP)",
6
  "num_examples": 3041,
7
- "bleu_1": 0.16499879686902857,
8
- "bleu_4": 0.033400783448202014,
9
- "meteor": 0.2057195729907702,
10
- "rouge_l": 0.15262886260140987,
11
- "chexpert_f1_14_micro": 0.26065662978414655,
12
- "chexpert_f1_5_micro": 0.246974358974359,
13
- "chexpert_f1_14_macro": 0.1239880617810402,
14
- "chexpert_f1_5_macro": 0.16818421256006927,
15
- "chexpert_f1_micro": 0.26065662978414655,
16
- "chexpert_f1_macro": 0.1239880617810402,
17
  "chexpert_per_label_f1": {
18
- "Enlarged Cardiomediastinum": 0.0776255707762557,
19
- "Cardiomegaly": 0.39155672823218995,
20
  "Lung Opacity": 0.004073319755600814,
21
  "Lung Lesion": 0.0,
22
- "Edema": 0.24839400428265523,
23
  "Consolidation": 0.0,
24
  "Pneumonia": 0.0,
25
  "Atelectasis": 0.008695652173913044,
26
  "Pneumothorax": 0.0,
27
- "Pleural Effusion": 0.192274678111588,
28
  "Pleural Other": 0.0,
29
- "Fracture": 0.017391304347826087,
30
- "Support Devices": 0.4812382739212008,
31
- "No Finding": 0.3145833333333333
32
  },
33
- "radgraph_f1": 0.09410311365933419,
34
- "radgraph_f1_entity": 0.14542321670985509,
35
- "radgraph_f1_relation": 0.12964295145994836,
36
  "radgraph_available": true,
37
  "radgraph_error": null,
38
  "evaluation_suite": "mimic_test_dual",
@@ -42,35 +42,35 @@
42
  "dataset": "mimic-cxr",
43
  "view_filter": "frontal-only (PA/AP)",
44
  "num_examples": 3041,
45
- "bleu_1": 0.16499879686902857,
46
- "bleu_4": 0.033400783448202014,
47
- "meteor": 0.2057195729907702,
48
- "rouge_l": 0.15262886260140987,
49
- "chexpert_f1_14_micro": 0.26065662978414655,
50
- "chexpert_f1_5_micro": 0.246974358974359,
51
- "chexpert_f1_14_macro": 0.1239880617810402,
52
- "chexpert_f1_5_macro": 0.16818421256006927,
53
- "chexpert_f1_micro": 0.26065662978414655,
54
- "chexpert_f1_macro": 0.1239880617810402,
55
  "chexpert_per_label_f1": {
56
- "Enlarged Cardiomediastinum": 0.0776255707762557,
57
- "Cardiomegaly": 0.39155672823218995,
58
  "Lung Opacity": 0.004073319755600814,
59
  "Lung Lesion": 0.0,
60
- "Edema": 0.24839400428265523,
61
  "Consolidation": 0.0,
62
  "Pneumonia": 0.0,
63
  "Atelectasis": 0.008695652173913044,
64
  "Pneumothorax": 0.0,
65
- "Pleural Effusion": 0.192274678111588,
66
  "Pleural Other": 0.0,
67
- "Fracture": 0.017391304347826087,
68
- "Support Devices": 0.4812382739212008,
69
- "No Finding": 0.3145833333333333
70
  },
71
- "radgraph_f1": 0.09410311365933419,
72
- "radgraph_f1_entity": 0.14542321670985509,
73
- "radgraph_f1_relation": 0.12964295145994836,
74
  "radgraph_available": true,
75
  "radgraph_error": null
76
  },
@@ -80,35 +80,35 @@
80
  "dataset": "mimic-cxr",
81
  "view_filter": "frontal-only (PA/AP), structured Findings section only",
82
  "num_examples": 2210,
83
- "bleu_1": 0.17491187190057955,
84
- "bleu_4": 0.03966117310602323,
85
- "meteor": 0.22311507091428398,
86
- "rouge_l": 0.1612770175038926,
87
- "chexpert_f1_14_micro": 0.2501020547013199,
88
- "chexpert_f1_5_micro": 0.23749208359721344,
89
- "chexpert_f1_14_macro": 0.12030236160434729,
90
- "chexpert_f1_5_macro": 0.16269249240448827,
91
- "chexpert_f1_micro": 0.2501020547013199,
92
- "chexpert_f1_macro": 0.12030236160434729,
93
  "chexpert_per_label_f1": {
94
- "Enlarged Cardiomediastinum": 0.0625,
95
- "Cardiomegaly": 0.3613109512390088,
96
  "Lung Opacity": 0.005772005772005772,
97
  "Lung Lesion": 0.0,
98
- "Edema": 0.26058631921824105,
99
  "Consolidation": 0.0,
100
  "Pneumonia": 0.0,
101
  "Atelectasis": 0.013186813186813187,
102
  "Pneumothorax": 0.0,
103
- "Pleural Effusion": 0.1783783783783784,
104
  "Pleural Other": 0.0,
105
- "Fracture": 0.022988505747126436,
106
- "Support Devices": 0.415625,
107
- "No Finding": 0.36388508891928867
108
  },
109
- "radgraph_f1": 0.10468134329680011,
110
- "radgraph_f1_entity": 0.1595464585348944,
111
- "radgraph_f1_relation": 0.14191739966668873,
112
  "radgraph_available": true,
113
  "radgraph_error": null
114
  }
 
4
  "dataset": "mimic-cxr",
5
  "view_filter": "frontal-only (PA/AP)",
6
  "num_examples": 3041,
7
+ "bleu_1": 0.23460907118482577,
8
+ "bleu_4": 0.0483690414206241,
9
+ "meteor": 0.21291121731396784,
10
+ "rouge_l": 0.17453617861562737,
11
+ "chexpert_f1_14_micro": 0.31163845751177804,
12
+ "chexpert_f1_5_micro": 0.24861538461538463,
13
+ "chexpert_f1_14_macro": 0.13629250906293128,
14
+ "chexpert_f1_5_macro": 0.16862522291180843,
15
+ "chexpert_f1_micro": 0.31163845751177804,
16
+ "chexpert_f1_macro": 0.13629250906293128,
17
  "chexpert_per_label_f1": {
18
+ "Enlarged Cardiomediastinum": 0.07407407407407407,
19
+ "Cardiomegaly": 0.39663335086796425,
20
  "Lung Opacity": 0.004073319755600814,
21
  "Lung Lesion": 0.0,
22
+ "Edema": 0.2462526766595289,
23
  "Consolidation": 0.0,
24
  "Pneumonia": 0.0,
25
  "Atelectasis": 0.008695652173913044,
26
  "Pneumothorax": 0.0,
27
+ "Pleural Effusion": 0.1915444348576359,
28
  "Pleural Other": 0.0,
29
+ "Fracture": 0.017543859649122806,
30
+ "Support Devices": 0.6656580937972768,
31
+ "No Finding": 0.30361966504592114
32
  },
33
+ "radgraph_f1": 0.0938551356876054,
34
+ "radgraph_f1_entity": 0.14413244058497404,
35
+ "radgraph_f1_relation": 0.12803672953985817,
36
  "radgraph_available": true,
37
  "radgraph_error": null,
38
  "evaluation_suite": "mimic_test_dual",
 
42
  "dataset": "mimic-cxr",
43
  "view_filter": "frontal-only (PA/AP)",
44
  "num_examples": 3041,
45
+ "bleu_1": 0.23460907118482577,
46
+ "bleu_4": 0.0483690414206241,
47
+ "meteor": 0.21291121731396784,
48
+ "rouge_l": 0.17453617861562737,
49
+ "chexpert_f1_14_micro": 0.31163845751177804,
50
+ "chexpert_f1_5_micro": 0.24861538461538463,
51
+ "chexpert_f1_14_macro": 0.13629250906293128,
52
+ "chexpert_f1_5_macro": 0.16862522291180843,
53
+ "chexpert_f1_micro": 0.31163845751177804,
54
+ "chexpert_f1_macro": 0.13629250906293128,
55
  "chexpert_per_label_f1": {
56
+ "Enlarged Cardiomediastinum": 0.07407407407407407,
57
+ "Cardiomegaly": 0.39663335086796425,
58
  "Lung Opacity": 0.004073319755600814,
59
  "Lung Lesion": 0.0,
60
+ "Edema": 0.2462526766595289,
61
  "Consolidation": 0.0,
62
  "Pneumonia": 0.0,
63
  "Atelectasis": 0.008695652173913044,
64
  "Pneumothorax": 0.0,
65
+ "Pleural Effusion": 0.1915444348576359,
66
  "Pleural Other": 0.0,
67
+ "Fracture": 0.017543859649122806,
68
+ "Support Devices": 0.6656580937972768,
69
+ "No Finding": 0.30361966504592114
70
  },
71
+ "radgraph_f1": 0.0938551356876054,
72
+ "radgraph_f1_entity": 0.14413244058497404,
73
+ "radgraph_f1_relation": 0.12803672953985817,
74
  "radgraph_available": true,
75
  "radgraph_error": null
76
  },
 
80
  "dataset": "mimic-cxr",
81
  "view_filter": "frontal-only (PA/AP), structured Findings section only",
82
  "num_examples": 2210,
83
+ "bleu_1": 0.24804371044734913,
84
+ "bleu_4": 0.05730693271738745,
85
+ "meteor": 0.2309676565725014,
86
+ "rouge_l": 0.18476844395763578,
87
+ "chexpert_f1_14_micro": 0.2921437031188314,
88
+ "chexpert_f1_5_micro": 0.23939202026599113,
89
+ "chexpert_f1_14_macro": 0.13259269532627468,
90
+ "chexpert_f1_5_macro": 0.1635857001735776,
91
+ "chexpert_f1_micro": 0.2921437031188314,
92
+ "chexpert_f1_macro": 0.13259269532627468,
93
  "chexpert_per_label_f1": {
94
+ "Enlarged Cardiomediastinum": 0.06293706293706294,
95
+ "Cardiomegaly": 0.3652312599681021,
96
  "Lung Opacity": 0.005772005772005772,
97
  "Lung Lesion": 0.0,
98
+ "Edema": 0.2601626016260163,
99
  "Consolidation": 0.0,
100
  "Pneumonia": 0.0,
101
  "Atelectasis": 0.013186813186813187,
102
  "Pneumothorax": 0.0,
103
+ "Pleural Effusion": 0.1793478260869565,
104
  "Pleural Other": 0.0,
105
+ "Fracture": 0.023255813953488372,
106
+ "Support Devices": 0.5962264150943396,
107
+ "No Finding": 0.3501779359430605
108
  },
109
+ "radgraph_f1": 0.10463721960424775,
110
+ "radgraph_f1_entity": 0.15836826410474694,
111
+ "radgraph_f1_relation": 0.1404934373559056,
112
  "radgraph_available": true,
113
  "radgraph_error": null
114
  }
evaluations/mimic_test_predictions.csv CHANGED
The diff for this file is too large to render. See raw diff
 
run_summary.json CHANGED
@@ -50,35 +50,35 @@
50
  "dataset": "mimic-cxr",
51
  "view_filter": "frontal-only (PA/AP)",
52
  "num_examples": 3041,
53
- "bleu_1": 0.16499879686902857,
54
- "bleu_4": 0.033400783448202014,
55
- "meteor": 0.2057195729907702,
56
- "rouge_l": 0.15262886260140987,
57
- "chexpert_f1_14_micro": 0.26065662978414655,
58
- "chexpert_f1_5_micro": 0.246974358974359,
59
- "chexpert_f1_14_macro": 0.1239880617810402,
60
- "chexpert_f1_5_macro": 0.16818421256006927,
61
- "chexpert_f1_micro": 0.26065662978414655,
62
- "chexpert_f1_macro": 0.1239880617810402,
63
  "chexpert_per_label_f1": {
64
- "Enlarged Cardiomediastinum": 0.0776255707762557,
65
- "Cardiomegaly": 0.39155672823218995,
66
  "Lung Opacity": 0.004073319755600814,
67
  "Lung Lesion": 0.0,
68
- "Edema": 0.24839400428265523,
69
  "Consolidation": 0.0,
70
  "Pneumonia": 0.0,
71
  "Atelectasis": 0.008695652173913044,
72
  "Pneumothorax": 0.0,
73
- "Pleural Effusion": 0.192274678111588,
74
  "Pleural Other": 0.0,
75
- "Fracture": 0.017391304347826087,
76
- "Support Devices": 0.4812382739212008,
77
- "No Finding": 0.3145833333333333
78
  },
79
- "radgraph_f1": 0.09410311365933419,
80
- "radgraph_f1_entity": 0.14542321670985509,
81
- "radgraph_f1_relation": 0.12964295145994836,
82
  "radgraph_available": true,
83
  "radgraph_error": null
84
  },
@@ -89,35 +89,35 @@
89
  "dataset": "mimic-cxr",
90
  "view_filter": "frontal-only (PA/AP)",
91
  "num_examples": 3041,
92
- "bleu_1": 0.16499879686902857,
93
- "bleu_4": 0.033400783448202014,
94
- "meteor": 0.2057195729907702,
95
- "rouge_l": 0.15262886260140987,
96
- "chexpert_f1_14_micro": 0.26065662978414655,
97
- "chexpert_f1_5_micro": 0.246974358974359,
98
- "chexpert_f1_14_macro": 0.1239880617810402,
99
- "chexpert_f1_5_macro": 0.16818421256006927,
100
- "chexpert_f1_micro": 0.26065662978414655,
101
- "chexpert_f1_macro": 0.1239880617810402,
102
  "chexpert_per_label_f1": {
103
- "Enlarged Cardiomediastinum": 0.0776255707762557,
104
- "Cardiomegaly": 0.39155672823218995,
105
  "Lung Opacity": 0.004073319755600814,
106
  "Lung Lesion": 0.0,
107
- "Edema": 0.24839400428265523,
108
  "Consolidation": 0.0,
109
  "Pneumonia": 0.0,
110
  "Atelectasis": 0.008695652173913044,
111
  "Pneumothorax": 0.0,
112
- "Pleural Effusion": 0.192274678111588,
113
  "Pleural Other": 0.0,
114
- "Fracture": 0.017391304347826087,
115
- "Support Devices": 0.4812382739212008,
116
- "No Finding": 0.3145833333333333
117
  },
118
- "radgraph_f1": 0.09410311365933419,
119
- "radgraph_f1_entity": 0.14542321670985509,
120
- "radgraph_f1_relation": 0.12964295145994836,
121
  "radgraph_available": true,
122
  "radgraph_error": null
123
  },
@@ -127,35 +127,35 @@
127
  "dataset": "mimic-cxr",
128
  "view_filter": "frontal-only (PA/AP), structured Findings section only",
129
  "num_examples": 2210,
130
- "bleu_1": 0.17491187190057955,
131
- "bleu_4": 0.03966117310602323,
132
- "meteor": 0.22311507091428398,
133
- "rouge_l": 0.1612770175038926,
134
- "chexpert_f1_14_micro": 0.2501020547013199,
135
- "chexpert_f1_5_micro": 0.23749208359721344,
136
- "chexpert_f1_14_macro": 0.12030236160434729,
137
- "chexpert_f1_5_macro": 0.16269249240448827,
138
- "chexpert_f1_micro": 0.2501020547013199,
139
- "chexpert_f1_macro": 0.12030236160434729,
140
  "chexpert_per_label_f1": {
141
- "Enlarged Cardiomediastinum": 0.0625,
142
- "Cardiomegaly": 0.3613109512390088,
143
  "Lung Opacity": 0.005772005772005772,
144
  "Lung Lesion": 0.0,
145
- "Edema": 0.26058631921824105,
146
  "Consolidation": 0.0,
147
  "Pneumonia": 0.0,
148
  "Atelectasis": 0.013186813186813187,
149
  "Pneumothorax": 0.0,
150
- "Pleural Effusion": 0.1783783783783784,
151
  "Pleural Other": 0.0,
152
- "Fracture": 0.022988505747126436,
153
- "Support Devices": 0.415625,
154
- "No Finding": 0.36388508891928867
155
  },
156
- "radgraph_f1": 0.10468134329680011,
157
- "radgraph_f1_entity": 0.1595464585348944,
158
- "radgraph_f1_relation": 0.14191739966668873,
159
  "radgraph_available": true,
160
  "radgraph_error": null
161
  }
 
50
  "dataset": "mimic-cxr",
51
  "view_filter": "frontal-only (PA/AP)",
52
  "num_examples": 3041,
53
+ "bleu_1": 0.23460907118482577,
54
+ "bleu_4": 0.0483690414206241,
55
+ "meteor": 0.21291121731396784,
56
+ "rouge_l": 0.17453617861562737,
57
+ "chexpert_f1_14_micro": 0.31163845751177804,
58
+ "chexpert_f1_5_micro": 0.24861538461538463,
59
+ "chexpert_f1_14_macro": 0.13629250906293128,
60
+ "chexpert_f1_5_macro": 0.16862522291180843,
61
+ "chexpert_f1_micro": 0.31163845751177804,
62
+ "chexpert_f1_macro": 0.13629250906293128,
63
  "chexpert_per_label_f1": {
64
+ "Enlarged Cardiomediastinum": 0.07407407407407407,
65
+ "Cardiomegaly": 0.39663335086796425,
66
  "Lung Opacity": 0.004073319755600814,
67
  "Lung Lesion": 0.0,
68
+ "Edema": 0.2462526766595289,
69
  "Consolidation": 0.0,
70
  "Pneumonia": 0.0,
71
  "Atelectasis": 0.008695652173913044,
72
  "Pneumothorax": 0.0,
73
+ "Pleural Effusion": 0.1915444348576359,
74
  "Pleural Other": 0.0,
75
+ "Fracture": 0.017543859649122806,
76
+ "Support Devices": 0.6656580937972768,
77
+ "No Finding": 0.30361966504592114
78
  },
79
+ "radgraph_f1": 0.0938551356876054,
80
+ "radgraph_f1_entity": 0.14413244058497404,
81
+ "radgraph_f1_relation": 0.12803672953985817,
82
  "radgraph_available": true,
83
  "radgraph_error": null
84
  },
 
89
  "dataset": "mimic-cxr",
90
  "view_filter": "frontal-only (PA/AP)",
91
  "num_examples": 3041,
92
+ "bleu_1": 0.23460907118482577,
93
+ "bleu_4": 0.0483690414206241,
94
+ "meteor": 0.21291121731396784,
95
+ "rouge_l": 0.17453617861562737,
96
+ "chexpert_f1_14_micro": 0.31163845751177804,
97
+ "chexpert_f1_5_micro": 0.24861538461538463,
98
+ "chexpert_f1_14_macro": 0.13629250906293128,
99
+ "chexpert_f1_5_macro": 0.16862522291180843,
100
+ "chexpert_f1_micro": 0.31163845751177804,
101
+ "chexpert_f1_macro": 0.13629250906293128,
102
  "chexpert_per_label_f1": {
103
+ "Enlarged Cardiomediastinum": 0.07407407407407407,
104
+ "Cardiomegaly": 0.39663335086796425,
105
  "Lung Opacity": 0.004073319755600814,
106
  "Lung Lesion": 0.0,
107
+ "Edema": 0.2462526766595289,
108
  "Consolidation": 0.0,
109
  "Pneumonia": 0.0,
110
  "Atelectasis": 0.008695652173913044,
111
  "Pneumothorax": 0.0,
112
+ "Pleural Effusion": 0.1915444348576359,
113
  "Pleural Other": 0.0,
114
+ "Fracture": 0.017543859649122806,
115
+ "Support Devices": 0.6656580937972768,
116
+ "No Finding": 0.30361966504592114
117
  },
118
+ "radgraph_f1": 0.0938551356876054,
119
+ "radgraph_f1_entity": 0.14413244058497404,
120
+ "radgraph_f1_relation": 0.12803672953985817,
121
  "radgraph_available": true,
122
  "radgraph_error": null
123
  },
 
127
  "dataset": "mimic-cxr",
128
  "view_filter": "frontal-only (PA/AP), structured Findings section only",
129
  "num_examples": 2210,
130
+ "bleu_1": 0.24804371044734913,
131
+ "bleu_4": 0.05730693271738745,
132
+ "meteor": 0.2309676565725014,
133
+ "rouge_l": 0.18476844395763578,
134
+ "chexpert_f1_14_micro": 0.2921437031188314,
135
+ "chexpert_f1_5_micro": 0.23939202026599113,
136
+ "chexpert_f1_14_macro": 0.13259269532627468,
137
+ "chexpert_f1_5_macro": 0.1635857001735776,
138
+ "chexpert_f1_micro": 0.2921437031188314,
139
+ "chexpert_f1_macro": 0.13259269532627468,
140
  "chexpert_per_label_f1": {
141
+ "Enlarged Cardiomediastinum": 0.06293706293706294,
142
+ "Cardiomegaly": 0.3652312599681021,
143
  "Lung Opacity": 0.005772005772005772,
144
  "Lung Lesion": 0.0,
145
+ "Edema": 0.2601626016260163,
146
  "Consolidation": 0.0,
147
  "Pneumonia": 0.0,
148
  "Atelectasis": 0.013186813186813187,
149
  "Pneumothorax": 0.0,
150
+ "Pleural Effusion": 0.1793478260869565,
151
  "Pleural Other": 0.0,
152
+ "Fracture": 0.023255813953488372,
153
+ "Support Devices": 0.5962264150943396,
154
+ "No Finding": 0.3501779359430605
155
  },
156
+ "radgraph_f1": 0.10463721960424775,
157
+ "radgraph_f1_entity": 0.15836826410474694,
158
+ "radgraph_f1_relation": 0.1404934373559056,
159
  "radgraph_available": true,
160
  "radgraph_error": null
161
  }