turn-detector / benchmark /benchmark_results.json
hayatiali's picture
Upload model via Fine-tune Assistant
29ec639 verified
{
"model_name": "turn-detector",
"generated_at": "2025-12-14T21:37:22.477273",
"difficulty_results": {
"baseline": {
"total": 20,
"correct": 18,
"accuracy": 0.9
},
"length_noise": {
"total": 20,
"correct": 10,
"accuracy": 0.5
},
"semantic_overlap": {
"total": 20,
"correct": 16,
"accuracy": 0.8
},
"edge_cases": {
"total": 20,
"correct": 11,
"accuracy": 0.55
}
},
"overall_accuracy": 0.6875,
"total_samples": 80,
"correct_samples": 55,
"samples": [
{
"text": "Ömer, nasıl yardımcı olabilirim?",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.8812354207038879,
"is_correct": true
},
{
"text": "Merhaba, hangi konuda yardım edebilirim?",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.9911393523216248,
"is_correct": true
},
{
"text": "Tabii ki, size bununla ilgili bilgi verebilirim.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.5156869292259216,
"is_correct": true
},
{
"text": "Elbette, bu konuda size destek olacağım.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.5563545823097229,
"is_correct": false
},
{
"text": "Anladım, hemen kontrol ediyorum.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.5459677577018738,
"is_correct": false
},
{
"text": "Lütfen bekleyin, birazdan yanıt vereceğim.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.8637070655822754,
"is_correct": true
},
{
"text": "Bu konuda yardımcı olmaktan memnuniyet duyarım.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.6278860569000244,
"is_correct": true
},
{
"text": "Hemen sizin için araştırıyorum.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.7357267737388611,
"is_correct": true
},
{
"text": "Endişelenmeyin, bu konuyu halledeceğiz.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.6491527557373047,
"is_correct": true
},
{
"text": "Herhangi başka bir sorunuz varsa, sormaktan çekinmeyin.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "agent_response",
"confidence": 0.9041098952293396,
"is_correct": true
},
{
"text": "totes agree lol",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9879427552223206,
"is_correct": false
},
{
"text": "yup yup yup yup yup",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.988431453704834,
"is_correct": false
},
{
"text": "OMG cant believe u did that, like seriously, i mean come on, its just too much, you know what i mean? cuz if you dont then idk what to say, like seriously",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.909318745136261,
"is_correct": true
},
{
"text": "nah bro",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9873980283737183,
"is_correct": false
},
{
"text": "yasss that's wassup",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.974721372127533,
"is_correct": false
},
{
"text": "okay okay okay i get it already no need to repeat urself over and over again like i'm not deaf or whatever",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.9450967907905579,
"is_correct": true
},
{
"text": "omg thts crazee",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9885514974594116,
"is_correct": false
},
{
"text": "u r kidding right?",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9817968606948853,
"is_correct": false
},
{
"text": "wow just wow, i mean, wow! i never thought that this would happen, like ever, not in a million years, and yet here we are, unbelievable, just totally unbelievable, you feel me?",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.8823995590209961,
"is_correct": true
},
{
"text": "hah lol whatevs",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9895368814468384,
"is_correct": false
},
{
"text": "Ah, anlıyorum. Devam edebilir misiniz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.8250168561935425,
"is_correct": true
},
{
"text": "Hmm, bunu biraz daha açabilir misiniz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.745111882686615,
"is_correct": true
},
{
"text": "Evet, bu gerçekten ilginç. Daha fazla bilgi verebilir misiniz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.9849535226821899,
"is_correct": true
},
{
"text": "Bu konuda düşündüğünüz başka bir şey var mı?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.9519035220146179,
"is_correct": true
},
{
"text": "Hımm, pekala. Başka bir açıdan bakacak olursak?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.903683066368103,
"is_correct": false
},
{
"text": "Evet, kesinlikle. Peki başka hangi yönlerini ele alabiliriz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.9927364587783813,
"is_correct": true
},
{
"text": "Tamam, peki buna ek olarak ne söyleyebilirsiniz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.9534065127372742,
"is_correct": true
},
{
"text": "Anladım, devam etmek ister misiniz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.974102795124054,
"is_correct": true
},
{
"text": "Evet, peki başka bir detaya dikkat çekmek ister misiniz?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.9879535436630249,
"is_correct": true
},
{
"text": "Hmm, çok iyi bir nokta. Bunu biraz daha açar mısınız?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.9757851362228394,
"is_correct": true
},
{
"text": "Oh great, another software update that will surely make everything run faster, just like last time.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.895721971988678,
"is_correct": true
},
{
"text": "I'm sure the server downtime at exactly 5 PM on a Friday was purely coincidental, and not at all inconvenient.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.849263072013855,
"is_correct": true
},
{
"text": "Yeah, because deleting the database with a single command is exactly what everyone wants, right?",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.7744247317314148,
"is_correct": true
},
{
"text": "I just love it when my AI assistant corrects me even when I'm right, it's like having a personal grammar teacher.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.5396984815597534,
"is_correct": true
},
{
"text": "No, I absolutely don't need any more disk space. Who needs to store files anyway?",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9811112284660339,
"is_correct": true
},
{
"text": "Sure, let's implement the new feature without any testing. What could possibly go wrong?",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9612233638763428,
"is_correct": true
},
{
"text": "Oh, another meeting about meetings? This is exactly why I got into tech.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9544288516044617,
"is_correct": true
},
{
"text": "I'm really looking forward to debugging this code at 2 AM again. It's the highlight of my week.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.8809834122657776,
"is_correct": true
},
{
"text": "The best part of working with AI is when it confidently gives you the wrong answer.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.8558328151702881,
"is_correct": true
},
{
"text": "Of course, let’s deploy the untested code on a Friday evening, I have nothing better to do.",
"expected_label": "agent_response",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.7736720442771912,
"is_correct": true
},
{
"text": "Evet, seni anlıyorum.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.8567759990692139,
"is_correct": true
},
{
"text": "Hmm, ilginç.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.985055685043335,
"is_correct": true
},
{
"text": "Evet, devam et.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.8956389427185059,
"is_correct": true
},
{
"text": "Gerçekten mi?",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.9868144989013672,
"is_correct": true
},
{
"text": "Tamam, bu mantıklı.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.7614496946334839,
"is_correct": true
},
{
"text": "Anladım.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.9884626269340515,
"is_correct": true
},
{
"text": "Evet, bu doğru.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.8082573413848877,
"is_correct": true
},
{
"text": "Ah, şimdi anlıyorum.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.9578026533126831,
"is_correct": true
},
{
"text": "Bu ilginç bir nokta.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.6748051643371582,
"is_correct": true
},
{
"text": "Evet, buna katılıyorum.",
"expected_label": "backchannel",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.8088875412940979,
"is_correct": true
},
{
"text": "yaaaa broooo",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9909811615943909,
"is_correct": true
},
{
"text": "huh? r u srz??",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9855925440788269,
"is_correct": true
},
{
"text": "OMG this is like the most amazing thing ever I mean I can't even begin to explain how incredible this whole situation is because it's just that awesome you know what I mean like seriously wow just wow ok???",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.7402034997940063,
"is_correct": false
},
{
"text": "idk wat u mean",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9897193908691406,
"is_correct": true
},
{
"text": "sure sure sure sure sure",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9763302206993103,
"is_correct": true
},
{
"text": "omg totally 100% agree with you on that one no doubt about it in fact I was just thinking the same thing the other day and it's crazy how we're like on the same wavelength all the time isn't it?",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.9482101798057556,
"is_correct": false
},
{
"text": "no wayyyy",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.991447925567627,
"is_correct": true
},
{
"text": "heyyy, u ther?",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.990699827671051,
"is_correct": true
},
{
"text": "wow cant believe it happened like that i mean who would have thought that everything would turn out this way after all the planning we did it just goes to show that sometimes things have a way of working out on their own despite all the odds and challenges we faced right from the start",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.971515953540802,
"is_correct": false
},
{
"text": "kk thx bye",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.99072265625,
"is_correct": true
},
{
"text": "Hmm, ilginç bir nokta.",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.9318225979804993,
"is_correct": true
},
{
"text": "Anladım, peki ya sonra?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.9160572290420532,
"is_correct": true
},
{
"text": "Hmm, o konuda biraz daha bilgi verir misin?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.7073332667350769,
"is_correct": false
},
{
"text": "Gerçekten mi? Daha fazla duymak isterim.",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.7160800099372864,
"is_correct": true
},
{
"text": "Bu mantıklı, başka neler oldu?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.812181293964386,
"is_correct": false
},
{
"text": "Hmm, bunu daha önce duymamıştım.",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.8978190422058105,
"is_correct": true
},
{
"text": "Bir dakika, bunu doğru mu anlıyorum?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.7696111798286438,
"is_correct": false
},
{
"text": "Peki, sonra ne yaptılar?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.6477120518684387,
"is_correct": true
},
{
"text": "Gerçekten mi? Bu beni düşündürdü.",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.9161955714225769,
"is_correct": true
},
{
"text": "İlginç, devam et lütfen.",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.7439655661582947,
"is_correct": true
},
{
"text": "Evet evet, tabii ki de tebrik ederim, dünya harikası bir iş çıkardın (!)",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.877510666847229,
"is_correct": false
},
{
"text": "Çok güzel, bu kadar net bir çözüm bulduğunu(!) hiç düşünmemiştim doğrusu.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9826798439025879,
"is_correct": false
},
{
"text": "Ah, tabii ki! Çünkü herkes daima müşteri hizmetlerinin ne kadar hızlı olduğunu söyler (!)",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.5608082413673401,
"is_correct": false
},
{
"text": "Eğer bu kadar 'yaratıcı' bir fikir daha duyar mıyım diye düşünüyordum, teşekkürler!",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9653686881065369,
"is_correct": false
},
{
"text": "Bir işin en iyi nasıl yapılmaması gerektiğini görmek için harika (!) bir örnekti.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9630967378616333,
"is_correct": false
},
{
"text": "Evet, kesinlikle bugünkü toplantıda hiçbir şey anlaşılmadı diyemem.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.8947334289550781,
"is_correct": false
},
{
"text": "Harika, seninki gibi bir çözüm sayesinde sorunlarımız iki katına çıkacak (!)",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.8286226987838745,
"is_correct": false
},
{
"text": "Tabii ki de, Türk çayı yurt dışında sudan bile ucuzdur (!).",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "backchannel",
"confidence": 0.8883209228515625,
"is_correct": true
},
{
"text": "Bu kadar ‘detaylı’ bir analiz için üç cümle yeterli oldu, harikasın!",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.610821545124054,
"is_correct": false
},
{
"text": "Elbette, herkesin sabırsızlıkla beklediği o 'harika' PowerPoint sunumunu bir daha görelim.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9590893387794495,
"is_correct": false
}
],
"misclassifications": [
{
"text": "Elbette, bu konuda size destek olacağım.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.5563545823097229,
"is_correct": false
},
{
"text": "Anladım, hemen kontrol ediyorum.",
"expected_label": "agent_response",
"difficulty": "baseline",
"predicted_label": "backchannel",
"confidence": 0.5459677577018738,
"is_correct": false
},
{
"text": "totes agree lol",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9879427552223206,
"is_correct": false
},
{
"text": "yup yup yup yup yup",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.988431453704834,
"is_correct": false
},
{
"text": "nah bro",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9873980283737183,
"is_correct": false
},
{
"text": "yasss that's wassup",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.974721372127533,
"is_correct": false
},
{
"text": "omg thts crazee",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9885514974594116,
"is_correct": false
},
{
"text": "u r kidding right?",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9817968606948853,
"is_correct": false
},
{
"text": "hah lol whatevs",
"expected_label": "agent_response",
"difficulty": "length_noise",
"predicted_label": "backchannel",
"confidence": 0.9895368814468384,
"is_correct": false
},
{
"text": "Hımm, pekala. Başka bir açıdan bakacak olursak?",
"expected_label": "agent_response",
"difficulty": "semantic_overlap",
"predicted_label": "backchannel",
"confidence": 0.903683066368103,
"is_correct": false
},
{
"text": "OMG this is like the most amazing thing ever I mean I can't even begin to explain how incredible this whole situation is because it's just that awesome you know what I mean like seriously wow just wow ok???",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.7402034997940063,
"is_correct": false
},
{
"text": "omg totally 100% agree with you on that one no doubt about it in fact I was just thinking the same thing the other day and it's crazy how we're like on the same wavelength all the time isn't it?",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.9482101798057556,
"is_correct": false
},
{
"text": "wow cant believe it happened like that i mean who would have thought that everything would turn out this way after all the planning we did it just goes to show that sometimes things have a way of working out on their own despite all the odds and challenges we faced right from the start",
"expected_label": "backchannel",
"difficulty": "length_noise",
"predicted_label": "agent_response",
"confidence": 0.971515953540802,
"is_correct": false
},
{
"text": "Hmm, o konuda biraz daha bilgi verir misin?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.7073332667350769,
"is_correct": false
},
{
"text": "Bu mantıklı, başka neler oldu?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.812181293964386,
"is_correct": false
},
{
"text": "Bir dakika, bunu doğru mu anlıyorum?",
"expected_label": "backchannel",
"difficulty": "semantic_overlap",
"predicted_label": "agent_response",
"confidence": 0.7696111798286438,
"is_correct": false
},
{
"text": "Evet evet, tabii ki de tebrik ederim, dünya harikası bir iş çıkardın (!)",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.877510666847229,
"is_correct": false
},
{
"text": "Çok güzel, bu kadar net bir çözüm bulduğunu(!) hiç düşünmemiştim doğrusu.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9826798439025879,
"is_correct": false
},
{
"text": "Ah, tabii ki! Çünkü herkes daima müşteri hizmetlerinin ne kadar hızlı olduğunu söyler (!)",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.5608082413673401,
"is_correct": false
},
{
"text": "Eğer bu kadar 'yaratıcı' bir fikir daha duyar mıyım diye düşünüyordum, teşekkürler!",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9653686881065369,
"is_correct": false
},
{
"text": "Bir işin en iyi nasıl yapılmaması gerektiğini görmek için harika (!) bir örnekti.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9630967378616333,
"is_correct": false
},
{
"text": "Evet, kesinlikle bugünkü toplantıda hiçbir şey anlaşılmadı diyemem.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.8947334289550781,
"is_correct": false
},
{
"text": "Harika, seninki gibi bir çözüm sayesinde sorunlarımız iki katına çıkacak (!)",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.8286226987838745,
"is_correct": false
},
{
"text": "Bu kadar ‘detaylı’ bir analiz için üç cümle yeterli oldu, harikasın!",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.610821545124054,
"is_correct": false
},
{
"text": "Elbette, herkesin sabırsızlıkla beklediği o 'harika' PowerPoint sunumunu bir daha görelim.",
"expected_label": "backchannel",
"difficulty": "edge_cases",
"predicted_label": "agent_response",
"confidence": 0.9590893387794495,
"is_correct": false
}
]
}