davanstrien's picture
download
raw
21.9 kB
{
"summary": {
"model": "davanstrien/qwen35-4b-iconclass-grpo-v5recall",
"dataset": "davanstrien/iconclass-vlm-sft",
"split": "test",
"num_evaluated": 40,
"num_skipped": 0,
"elapsed_seconds": 299.1,
"exact_match_accuracy": 0.075,
"hierarchical_f1": 0.5421,
"code_precision": 0.255,
"code_recall": 0.255,
"code_f1": 0.255,
"valid_json_pct": 1.0,
"valid_code_pct": 1.0
},
"results": [
{
"index": 0,
"gt_codes": [
"92B361",
"12B13",
"12EE13",
"25F33(EAGLE)",
"31E3"
],
"predicted_codes": [
"73",
"73D721",
"73D7211"
],
"generated_text": "{\"iconclass-codes\": [\"73\", \"73D721\", \"73D7211\"]}",
"valid_json": true,
"valid_code_count": 3,
"total_predicted": 3,
"exact_match": false,
"hierarchical_f1": 0.0,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 1,
"gt_codes": [
"48C27(+321)",
"92F2"
],
"predicted_codes": [
"48C24"
],
"generated_text": "{\"iconclass-codes\": [\"48C24\"]}",
"valid_json": true,
"valid_code_count": 1,
"total_predicted": 1,
"exact_match": false,
"hierarchical_f1": 0.5333333333333333,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 2,
"gt_codes": [
"86(MONSTRATUR IN UNDIS)",
"22C5:24A6",
"46C24",
"25H214",
"25I1"
],
"predicted_codes": [
"25H23",
"25H213",
"25I12",
"25H11",
"25I121"
],
"generated_text": "{\"iconclass-codes\": [\"25H23\", \"25H213\", \"25I12\", \"25H11\", \"25I121\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.4955357142857142,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 3,
"gt_codes": [
"11I613",
"11I1"
],
"predicted_codes": [
"44B113",
"44B114(PRECEPTOR)"
],
"generated_text": "{\"iconclass-codes\": [\"44B113\", \"44B114(PRECEPTOR)\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.0,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 4,
"gt_codes": [
"25H11",
"25H213",
"25I",
"46C112"
],
"predicted_codes": [
"25H11",
"25H213",
"46C112",
"46C13141",
"46C513"
],
"generated_text": "{\"iconclass-codes\": [\"25H11\", \"25H213\", \"46C112\", \"46C13141\", \"46C513\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.8582877111240534,
"code_precision": 0.6,
"code_recall": 0.75
},
{
"index": 5,
"gt_codes": [
"25G31",
"31D15",
"25H11",
"46C13142",
"25H"
],
"predicted_codes": [
"25H11",
"25H213",
"46C131",
"46C13141",
"46C513"
],
"generated_text": "{\"iconclass-codes\": [\"25H11\", \"25H213\", \"46C131\", \"46C13141\", \"46C513\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.6848470588235294,
"code_precision": 0.2,
"code_recall": 0.2
},
{
"index": 6,
"gt_codes": [
"25G41(CARNATION)",
"31A2421",
"31D15:61BB",
"41D221(SLUIERKAP)",
"61B(+53)"
],
"predicted_codes": [
"31A2421",
"31D15:61BB",
"61B(+53)",
"61B:31A2212(+1)"
],
"generated_text": "{\"iconclass-codes\": [\"31A2421\", \"31D15:61BB\", \"61B(+53)\", \"61B:31A2212(+1)\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.7175879396984924,
"code_precision": 0.75,
"code_recall": 0.6
},
{
"index": 7,
"gt_codes": [
"61B(+51)",
"41D221(TURBAN)",
"73",
"32B321",
"61B:31D14"
],
"predicted_codes": [
"31A2211",
"31A2421",
"31D14",
"61B(+52)",
"61B:31D14"
],
"generated_text": "{\"iconclass-codes\": [\"31A2211\", \"31A2421\", \"31D14\", \"61B(+52)\", \"61B:31D14\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.47296638655462186,
"code_precision": 0.2,
"code_recall": 0.2
},
{
"index": 8,
"gt_codes": [
"49L171",
"49M413",
"49M3",
"49L12(V)",
"49L12(E)"
],
"predicted_codes": [
"49L171",
"49M413",
"49M3",
"49L12(V)"
],
"generated_text": "{\"iconclass-codes\": [\"49L171\", \"49M413\", \"49M3\", \"49L12(V)\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 1.0,
"code_precision": 1.0,
"code_recall": 0.8
},
{
"index": 9,
"gt_codes": [
"31A231",
"31A2421",
"61B(+53)"
],
"predicted_codes": [
"31A231",
"31A2422",
"61B(+54)",
"61B:31A2212(+1)"
],
"generated_text": "{\"iconclass-codes\": [\"31A231\", \"31A2422\", \"61B(+54)\", \"61B:31A2212(+1)\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.9288014311270126,
"code_precision": 0.25,
"code_recall": 0.3333333333333333
},
{
"index": 10,
"gt_codes": [
"41C5",
"44B113",
"44B1511"
],
"predicted_codes": [
"83(Anonymus, Herzog Ernst)",
"44B113",
"44B191",
"44B192"
],
"generated_text": "{\"iconclass-codes\": [\"83(Anonymus, Herzog Ernst)\", \"44B113\", \"44B191\", \"44B192\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.65,
"code_precision": 0.25,
"code_recall": 0.3333333333333333
},
{
"index": 11,
"gt_codes": [
"25F711"
],
"predicted_codes": [
"25F711"
],
"generated_text": "{\"iconclass-codes\": [\"25F711\"]}",
"valid_json": true,
"valid_code_count": 1,
"total_predicted": 1,
"exact_match": true,
"hierarchical_f1": 1.0,
"code_precision": 1.0,
"code_recall": 1.0
},
{
"index": 12,
"gt_codes": [
"11Q712",
"25I22",
"34B11"
],
"predicted_codes": [
"11Q712",
"25I2"
],
"generated_text": "{\"iconclass-codes\": [\"11Q712\", \"25I2\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.704,
"code_precision": 0.5,
"code_recall": 0.3333333333333333
},
{
"index": 13,
"gt_codes": [
"54A44(+4)",
"54D3(+4)",
"51MM11(+4)",
"46C24111",
"25F44(+5246)"
],
"predicted_codes": [
"25F44(+512)",
"25F44(+5262)",
"54A7(+4)",
"86(QUOD NEMO VIDEAT)",
"86(QUE NEMO VIDEAT)"
],
"generated_text": "{\"iconclass-codes\": [\"25F44(+512)\", \"25F44(+5262)\", \"54A7(+4)\", \"86(QUOD NEMO VIDEAT)\", \"86(QUE NEMO VIDEAT)\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.469446088794926,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 14,
"gt_codes": [
"61B:31A2212(+1)",
"61B:31D14",
"31A2518",
"41D223(JERKIN)",
"31A231"
],
"predicted_codes": [
"31A231",
"31A2422",
"61B(+53)",
"61B:31A2212(+1)",
"61B:31D14"
],
"generated_text": "{\"iconclass-codes\": [\"31A231\", \"31A2422\", \"61B(+53)\", \"61B:31A2212(+1)\", \"61B:31D14\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.8130232558139536,
"code_precision": 0.6,
"code_recall": 0.6
},
{
"index": 15,
"gt_codes": [
"94C133"
],
"predicted_codes": [
"45H3",
"45C15(BOW)",
"45C15(ARROW)",
"45C15(ARROW)",
"45C15(ARROW)"
],
"generated_text": "{\"iconclass-codes\": [\"45H3\", \"45C15(BOW)\", \"45C15(ARROW)\", \"45C15(ARROW)\", \"45C15(ARROW)\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.0,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 16,
"gt_codes": [
"31A2422",
"61B(+52)",
"61B:31D14"
],
"predicted_codes": [
"11H(JOHN)"
],
"generated_text": "{\"iconclass-codes\": [\"11H(JOHN)\"]}",
"valid_json": true,
"valid_code_count": 1,
"total_predicted": 1,
"exact_match": false,
"hierarchical_f1": 0.0,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 17,
"gt_codes": [
"31A2422",
"45B",
"61B(+52)",
"61B:31D14"
],
"predicted_codes": [
"31A2422",
"45B",
"61B(+52)",
"61B:31D14"
],
"generated_text": "{\"iconclass-codes\": [\"31A2422\", \"45B\", \"61B(+52)\", \"61B:31D14\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": true,
"hierarchical_f1": 1.0,
"code_precision": 1.0,
"code_recall": 1.0
},
{
"index": 18,
"gt_codes": [
"46C13141(+763)"
],
"predicted_codes": [
"46C13141"
],
"generated_text": "{\"iconclass-codes\": [\"46C13141\"]}",
"valid_json": true,
"valid_code_count": 1,
"total_predicted": 1,
"exact_match": false,
"hierarchical_f1": 1.0,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 19,
"gt_codes": [
"31D15",
"49M32"
],
"predicted_codes": [
"31D15:61BB",
"41D221(CAP)",
"41D222(RUFF)",
"41D26611",
"41D2664"
],
"generated_text": "{\"iconclass-codes\": [\"31D15:61BB\", \"41D221(CAP)\", \"41D222(RUFF)\", \"41D26611\", \"41D2664\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.39921348314606736,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 20,
"gt_codes": [
"48C1612",
"48C2",
"11Q712",
"25H155",
"25I13"
],
"predicted_codes": [
"25G41(ROSE)",
"25G411(COLUMBINE)",
"25G411(FLAG)",
"25G411(FLAG)",
"25G411(FLAG)"
],
"generated_text": "{\"iconclass-codes\": [\"25G41(ROSE)\", \"25G411(COLUMBINE)\", \"25G411(FLAG)\", \"25G411(FLAG)\", \"25G411(FLAG)\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.22857142857142856,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 21,
"gt_codes": [
"31D15",
"41A1",
"31D112",
"25H15",
"25G3"
],
"predicted_codes": [
"25H15",
"25H155",
"41A17",
"46C11"
],
"generated_text": "{\"iconclass-codes\": [\"25H15\", \"25H155\", \"41A17\", \"46C11\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.5315651981403586,
"code_precision": 0.25,
"code_recall": 0.2
},
{
"index": 22,
"gt_codes": [
"41D221"
],
"predicted_codes": [
"44B112",
"61B2(OSMAN, SULTAN)1(+52)",
"61B2(OSMAN, SULTAN)1(+52)1"
],
"generated_text": "{\"iconclass-codes\": [\"44B112\", \"61B2(OSMAN, SULTAN)1(+52)\", \"61B2(OSMAN, SULTAN)1(+52)1\"]}",
"valid_json": true,
"valid_code_count": 3,
"total_predicted": 3,
"exact_match": false,
"hierarchical_f1": 0.1,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 23,
"gt_codes": [
"73A6"
],
"predicted_codes": [
"73C7213",
"73C7212",
"73C7211"
],
"generated_text": "{\"iconclass-codes\": [\"73C7213\", \"73C7212\", \"73C7211\"]}",
"valid_json": true,
"valid_code_count": 3,
"total_predicted": 3,
"exact_match": false,
"hierarchical_f1": 0.38000000000000006,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 24,
"gt_codes": [
"25F24(STAG)",
"25B3",
"48A9876",
"25F43",
"12Q21"
],
"predicted_codes": [
"48A9876",
"48A9875",
"48A98311",
"48A9871",
"48A98312"
],
"generated_text": "{\"iconclass-codes\": [\"48A9876\", \"48A9875\", \"48A98311\", \"48A9871\", \"48A98312\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.328698752228164,
"code_precision": 0.2,
"code_recall": 0.2
},
{
"index": 25,
"gt_codes": [
"73C8212",
"73C8214",
"73C8215"
],
"predicted_codes": [
"73G326",
"73G3261"
],
"generated_text": "{\"iconclass-codes\": [\"73G326\", \"73G3261\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.39493670886075954,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 26,
"gt_codes": [
"73A11"
],
"predicted_codes": [
"73C721",
"73C7211"
],
"generated_text": "{\"iconclass-codes\": [\"73C721\", \"73C7211\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.38,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 27,
"gt_codes": [
"49L171",
"49M413",
"49M3",
"49L12(S)"
],
"predicted_codes": [
"49L171",
"49M413",
"49M3",
"49L12(S)"
],
"generated_text": "{\"iconclass-codes\": [\"49L171\", \"49M413\", \"49M3\", \"49L12(S)\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": true,
"hierarchical_f1": 1.0,
"code_precision": 1.0,
"code_recall": 1.0
},
{
"index": 28,
"gt_codes": [
"41C741",
"43B31"
],
"predicted_codes": [
"41C12",
"41C741",
"41C741(+1)",
"41C741(+1):46A14",
"46A14"
],
"generated_text": "{\"iconclass-codes\": [\"41C12\", \"41C741\", \"41C741(+1)\", \"41C741(+1):46A14\", \"46A14\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.6682422451994091,
"code_precision": 0.2,
"code_recall": 0.5
},
{
"index": 29,
"gt_codes": [
"46C21",
"46C223"
],
"predicted_codes": [
"25I1",
"46C24"
],
"generated_text": "{\"iconclass-codes\": [\"25I1\", \"46C24\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.5288135593220339,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 30,
"gt_codes": [
"49E391"
],
"predicted_codes": [
"41C326",
"41C741",
"41C7411",
"41C74111"
],
"generated_text": "{\"iconclass-codes\": [\"41C326\", \"41C741\", \"41C7411\", \"41C74111\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.19746835443037977,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 31,
"gt_codes": [
"31A231",
"31D15",
"41D2321",
"61B(+55)"
],
"predicted_codes": [
"25G3",
"31D15",
"41D221(HAT)",
"41D2653",
"41D2661"
],
"generated_text": "{\"iconclass-codes\": [\"25G3\", \"31D15\", \"41D221(HAT)\", \"41D2653\", \"41D2661\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.6018734593262118,
"code_precision": 0.2,
"code_recall": 0.25
},
{
"index": 32,
"gt_codes": [
"73D58",
"73D641"
],
"predicted_codes": [
"73D641",
"73D642"
],
"generated_text": "{\"iconclass-codes\": [\"73D641\", \"73D642\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.8596541786743516,
"code_precision": 0.5,
"code_recall": 0.5
},
{
"index": 33,
"gt_codes": [
"33B3",
"41A221",
"41A722",
"56DD1"
],
"predicted_codes": [
"31D112",
"41A2",
"41A721",
"41A761",
"41A775"
],
"generated_text": "{\"iconclass-codes\": [\"31D112\", \"41A2\", \"41A721\", \"41A761\", \"41A775\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.5537960954446856,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 34,
"gt_codes": [
"25A3",
"45C41",
"45K21"
],
"predicted_codes": [
"25A3",
"45K"
],
"generated_text": "{\"iconclass-codes\": [\"25A3\", \"45K\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.711149825783972,
"code_precision": 0.5,
"code_recall": 0.3333333333333333
},
{
"index": 35,
"gt_codes": [
"73C8172",
"73C8171"
],
"predicted_codes": [
"73C721",
"73C7211"
],
"generated_text": "{\"iconclass-codes\": [\"73C721\", \"73C7211\"]}",
"valid_json": true,
"valid_code_count": 2,
"total_predicted": 2,
"exact_match": false,
"hierarchical_f1": 0.5924050632911392,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 36,
"gt_codes": [
"25F23(PANTHER)",
"31A2323",
"31A2518",
"42A1931",
"46C161"
],
"predicted_codes": [
"46A14",
"46C1442",
"46C14421",
"46C14422",
"46C14423"
],
"generated_text": "{\"iconclass-codes\": [\"46A14\", \"46C1442\", \"46C14421\", \"46C14422\", \"46C14423\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.2998356164383562,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 37,
"gt_codes": [
"12B61",
"25I",
"41A12"
],
"predicted_codes": [
"25I",
"25I1",
"25I146",
"41A12"
],
"generated_text": "{\"iconclass-codes\": [\"25I\", \"25I1\", \"25I146\", \"41A12\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.7210103329506313,
"code_precision": 0.5,
"code_recall": 0.6666666666666666
},
{
"index": 38,
"gt_codes": [
"23I41",
"41C32",
"41C12",
"31D14",
"47I4221"
],
"predicted_codes": [
"23K41",
"23O22",
"23K42",
"23K43",
"23K44"
],
"generated_text": "{\"iconclass-codes\": [\"23K41\", \"23O22\", \"23K42\", \"23K43\", \"23K44\"]}",
"valid_json": true,
"valid_code_count": 5,
"total_predicted": 5,
"exact_match": false,
"hierarchical_f1": 0.13333333333333333,
"code_precision": 0.0,
"code_recall": 0.0
},
{
"index": 39,
"gt_codes": [
"31D13",
"61B:31A2212(+1)",
"31A2421",
"41D222(RUFF)",
"31AA533(EMPIREKRULLEN)"
],
"predicted_codes": [
"31A2421",
"31D15:61BB",
"61B(+52)",
"61B:31A2212(+1)"
],
"generated_text": "{\"iconclass-codes\": [\"31A2421\", \"31D15:61BB\", \"61B(+52)\", \"61B:31A2212(+1)\"]}",
"valid_json": true,
"valid_code_count": 4,
"total_predicted": 4,
"exact_match": false,
"hierarchical_f1": 0.7436889332003987,
"code_precision": 0.5,
"code_recall": 0.4
}
]
}

Xet Storage Details

Size:
21.9 kB
·
Xet hash:
f38c3a5ca6eea8483c76278dc3efd266a5cef7a206a89ebffca77b151876f01f

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.