wanderlust-chatbot / docs /eval_ner.json
Kiriten892's picture
Wave 3: expand NER fixture 85->102, time_preference F1 0.40->0.98, people/duration fixes
a832dee
Raw
History Blame Contribute Delete
2.66 kB
{
"model": "ner",
"test_file": "C:\\Users\\Acer\\Downloads\\Wanderlust\\chatbot-ml-service\\app\\data\\datasets\\ner_eval.json",
"samples": 102,
"per_type": {
"activity_preference": {
"precision": 0.7560975609756098,
"recall": 0.8857142857142857,
"f1": 0.8157894736842105,
"tp": 31,
"fp": 10,
"fn": 4
},
"budget": {
"precision": 1.0,
"recall": 0.8181818181818182,
"f1": 0.9,
"tp": 9,
"fp": 0,
"fn": 2
},
"budget_priority": {
"precision": 0.8888888888888888,
"recall": 0.7272727272727273,
"f1": 0.7999999999999999,
"tp": 8,
"fp": 1,
"fn": 3
},
"cuisine": {
"precision": 0.9166666666666666,
"recall": 0.8461538461538461,
"f1": 0.8799999999999999,
"tp": 11,
"fp": 1,
"fn": 2
},
"destination": {
"precision": 0.9285714285714286,
"recall": 0.9629629629629629,
"f1": 0.9454545454545454,
"tp": 104,
"fp": 8,
"fn": 4
},
"dietary": {
"precision": 0.9375,
"recall": 0.8823529411764706,
"f1": 0.9090909090909091,
"tp": 15,
"fp": 1,
"fn": 2
},
"duration": {
"precision": 0.9583333333333334,
"recall": 0.9324324324324325,
"f1": 0.9452054794520548,
"tp": 69,
"fp": 3,
"fn": 5
},
"hotel_type": {
"precision": 0.7916666666666666,
"recall": 1.0,
"f1": 0.8837209302325582,
"tp": 19,
"fp": 5,
"fn": 0
},
"location": {
"precision": 0.9453125,
"recall": 0.968,
"f1": 0.9565217391304348,
"tp": 121,
"fp": 7,
"fn": 4
},
"origin": {
"precision": 0.9375,
"recall": 0.8333333333333334,
"f1": 0.8823529411764706,
"tp": 15,
"fp": 1,
"fn": 3
},
"people": {
"precision": 0.8148148148148148,
"recall": 0.8461538461538461,
"f1": 0.830188679245283,
"tp": 22,
"fp": 5,
"fn": 4
},
"time_preference": {
"precision": 1.0,
"recall": 0.9615384615384616,
"f1": 0.9803921568627451,
"tp": 25,
"fp": 0,
"fn": 1
},
"transport": {
"precision": 0.9375,
"recall": 0.9375,
"f1": 0.9375,
"tp": 15,
"fp": 1,
"fn": 1
},
"travel_style": {
"precision": 0.8918918918918919,
"recall": 0.868421052631579,
"f1": 0.88,
"tp": 33,
"fp": 4,
"fn": 5
}
},
"micro": {
"precision": 0.9136029411764706,
"recall": 0.925512104283054,
"f1": 0.9195189639222942
},
"error_count": 43
}