tuklu commited on
Commit
f3c157a
·
verified ·
1 Parent(s): 9989809

Add SHAP explainability analysis

Browse files
.gitattributes CHANGED
@@ -65,3 +65,9 @@ output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_full_roc.png
65
  output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_hindi_roc.png filter=lfs diff=lfs merge=lfs -text
66
  output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_hinglish_pr.png filter=lfs diff=lfs merge=lfs -text
67
  output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_hinglish_roc.png filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
65
  output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_hindi_roc.png filter=lfs diff=lfs merge=lfs -text
66
  output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_hinglish_pr.png filter=lfs diff=lfs merge=lfs -text
67
  output_v2/figures/hinglish_to_hindi_to_english/Phase_hinglish_eval_hinglish_roc.png filter=lfs diff=lfs merge=lfs -text
68
+ output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_english.png filter=lfs diff=lfs merge=lfs -text
69
+ output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_full.png filter=lfs diff=lfs merge=lfs -text
70
+ output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_hinglish.png filter=lfs diff=lfs merge=lfs -text
71
+ output_v2/shap/cross_model_comparison_full.png filter=lfs diff=lfs merge=lfs -text
72
+ output_v2/shap/cross_model_comparison_hindi.png filter=lfs diff=lfs merge=lfs -text
73
+ output_v2/shap/cross_model_comparison_hinglish.png filter=lfs diff=lfs merge=lfs -text
output_v2/shap/cross_model_comparison_english.png ADDED
output_v2/shap/cross_model_comparison_full.png ADDED

Git LFS Details

  • SHA256: 028ac7c356575510ccf3498c0cd7c00fc8e396c2755d5df531b2ee6f305f6ce6
  • Pointer size: 131 Bytes
  • Size of remote file: 148 kB
output_v2/shap/cross_model_comparison_hindi.png ADDED

Git LFS Details

  • SHA256: 0839849e6a0350d78cdedf777599f996568572442d8cb083c724432ef08868af
  • Pointer size: 131 Bytes
  • Size of remote file: 103 kB
output_v2/shap/cross_model_comparison_hinglish.png ADDED

Git LFS Details

  • SHA256: 99ebc8a60c214d8ab4bc6fc8d83370819a088cf8c721df875c797c31982acef4
  • Pointer size: 131 Bytes
  • Size of remote file: 109 kB
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_summary.csv ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ model,eval_lang,top_hate_words,top_nonhate_words
2
+ hinglish_to_hindi_to_english_v2,english,"nas(0.0408), fags(0.0308), sicko(0.0297), sabotage(0.0297), advocating(0.0223)","grow(-0.0357), barrel(-0.0341), homosexual(-0.0323), pak(-0.0301), join(-0.0241)"
3
+ hinglish_to_hindi_to_english_v2,hindi,"वादा(0.0033), वैज्ञानिकों(0.0033), ऐ(0.0032), उतारा(0.0032), गला(0.0030)","जीतेगा(-0.0072), घोंटने(-0.0042), जिहादी(-0.0039), आपत्तिजनक(-0.0039), चमचो(-0.0024)"
4
+ hinglish_to_hindi_to_english_v2,hinglish,"arey(0.0459), bahir(0.0409), punish(0.0396), papa(0.0389), interior(0.0373)","online(-0.0293), member(-0.0265), mam(-0.0230), messages(-0.0221), asha(-0.0204)"
5
+ hinglish_to_hindi_to_english_v2,full,"blamed(0.0648), criticized(0.0473), syntax(0.0467), grown(0.0392), sine(0.0352)","underneath(-0.1046), smack(-0.0426), online(-0.0403), hole(-0.0354), clue(-0.0314)"
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_english.csv ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ word,mean_shap,direction,abs_shap
2
+ nas,0.04084094986319542,hate,0.04084094986319542
3
+ grow,-0.03568753972649574,non-hate,0.03568753972649574
4
+ barrel,-0.03411834314465523,non-hate,0.03411834314465523
5
+ homosexual,-0.032309435307979584,non-hate,0.032309435307979584
6
+ fags,0.030772147700190544,hate,0.030772147700190544
7
+ pak,-0.030134739354252815,non-hate,0.030134739354252815
8
+ sicko,0.029741348698735237,hate,0.029741348698735237
9
+ sabotage,0.029711255803704262,hate,0.029711255803704262
10
+ join,-0.02413080632686615,non-hate,0.02413080632686615
11
+ advocating,0.02234148420393467,hate,0.02234148420393467
12
+ poppy,-0.02190038375556469,non-hate,0.02190038375556469
13
+ alien,-0.021285340189933777,non-hate,0.021285340189933777
14
+ cycle,0.0199173204600811,hate,0.0199173204600811
15
+ illegal,0.019460361175636837,hate,0.019460361175636837
16
+ crush,-0.01917188661172986,non-hate,0.01917188661172986
17
+ tit,0.01897701807320118,hate,0.01897701807320118
18
+ spoilt,0.017174284905195236,hate,0.017174284905195236
19
+ accused,0.016549019142985344,hate,0.016549019142985344
20
+ bigger,-0.016319772228598595,non-hate,0.016319772228598595
21
+ fault,0.016076564012716215,hate,0.016076564012716215
22
+ kad,0.01592048816382885,hate,0.01592048816382885
23
+ social,-0.015574524737894535,non-hate,0.015574524737894535
24
+ excuses,0.015325771644711494,hate,0.015325771644711494
25
+ polite,-0.015105613352109989,non-hate,0.015105613352109989
26
+ proverbial,0.014887955971062183,hate,0.014887955971062183
27
+ caught,0.01482851430773735,hate,0.01482851430773735
28
+ failed,0.014297339133918285,hate,0.014297339133918285
29
+ revising,-0.014272860251367092,non-hate,0.014272860251367092
30
+ boomer,-0.013116286136209965,non-hate,0.013116286136209965
31
+ wear,-0.012863598763942719,non-hate,0.012863598763942719
32
+ plot,-0.012858100235462189,non-hate,0.012858100235462189
33
+ vandalize,0.01270614832174033,hate,0.01270614832174033
34
+ unite,0.012388435192406178,hate,0.012388435192406178
35
+ bitchy,0.012348399497568607,hate,0.012348399497568607
36
+ perform,-0.012242045724633499,non-hate,0.012242045724633499
37
+ pride,0.011979740811511874,hate,0.011979740811511874
38
+ stop,0.011946490097146194,hate,0.011946490097146194
39
+ btw,0.011738581582903862,hate,0.011738581582903862
40
+ romania,0.011656457558274269,hate,0.011656457558274269
41
+ boon,0.011625840328633785,hate,0.011625840328633785
42
+ deny,0.011531622149050236,hate,0.011531622149050236
43
+ trans,0.011500706896185875,hate,0.011500706896185875
44
+ dear,-0.011394963517280607,non-hate,0.011394963517280607
45
+ wwf,0.011149724945425987,hate,0.011149724945425987
46
+ wikis,-0.011066155973821878,non-hate,0.011066155973821878
47
+ bro,-0.011030015535652637,non-hate,0.011030015535652637
48
+ rains,-0.010711784474551678,non-hate,0.010711784474551678
49
+ attitude,0.01068491442129016,hate,0.01068491442129016
50
+ hump,-0.01064093317836523,non-hate,0.01064093317836523
51
+ medicare,-0.010626320727169514,non-hate,0.010626320727169514
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_english.png ADDED

Git LFS Details

  • SHA256: 52d6cd69dff6c0d50709f8cfe306e69bf41d28250064b325a22fa05387f6c771
  • Pointer size: 131 Bytes
  • Size of remote file: 133 kB
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_full.csv ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ word,mean_shap,direction,abs_shap
2
+ underneath,-0.10458830744028091,non-hate,0.10458830744028091
3
+ blamed,0.06481243669986725,hate,0.06481243669986725
4
+ criticized,0.047305628657341,hate,0.047305628657341
5
+ syntax,0.046665407717227936,hate,0.046665407717227936
6
+ smack,-0.042638324201107025,non-hate,0.042638324201107025
7
+ online,-0.040302298963069916,non-hate,0.040302298963069916
8
+ grown,0.039168521761894226,hate,0.039168521761894226
9
+ hole,-0.035353163606487215,non-hate,0.035353163606487215
10
+ sine,0.03520340472459793,hate,0.03520340472459793
11
+ clue,-0.03141946718096733,non-hate,0.03141946718096733
12
+ eliza,-0.025371160358190536,non-hate,0.025371160358190536
13
+ fucked,0.02449769526720047,hate,0.02449769526720047
14
+ ruling,0.02396106906235218,hate,0.02396106906235218
15
+ expressive,0.023163892328739166,hate,0.023163892328739166
16
+ advocating,0.02261391095817089,hate,0.02261391095817089
17
+ manners,-0.022611092776060104,non-hate,0.022611092776060104
18
+ madam,0.022388344630599022,hate,0.022388344630599022
19
+ tweets,-0.0218605634290725,non-hate,0.0218605634290725
20
+ pr,0.02108542900532484,hate,0.02108542900532484
21
+ nawaz,0.019971828907728195,hate,0.019971828907728195
22
+ fateful,0.01936914399266243,hate,0.01936914399266243
23
+ congrats,0.019144877791404724,hate,0.019144877791404724
24
+ flip,0.01885046996176243,hate,0.01885046996176243
25
+ bitter,0.018671734258532524,hate,0.018671734258532524
26
+ dubious,0.016950108110904694,hate,0.016950108110904694
27
+ quran,-0.016676608473062515,non-hate,0.016676608473062515
28
+ turkey,0.016496842727065086,hate,0.016496842727065086
29
+ flop,0.015149658545851707,hate,0.015149658545851707
30
+ punish,0.014967915951274335,hate,0.014967915951274335
31
+ rosewood,-0.014851009473204613,non-hate,0.014851009473204613
32
+ exclude,0.01474262960255146,hate,0.01474262960255146
33
+ tha,0.014648808864876628,hate,0.014648808864876628
34
+ troubles,0.014084530994296074,hate,0.014084530994296074
35
+ attacks,0.013815064914524555,hate,0.013815064914524555
36
+ angela,-0.013330272398889065,non-hate,0.013330272398889065
37
+ bot,-0.01317788427695632,non-hate,0.01317788427695632
38
+ isko,-0.012968616560101509,non-hate,0.012968616560101509
39
+ cretin,-0.012747019529342651,non-hate,0.012747019529342651
40
+ du,0.012732747942209244,hate,0.012732747942209244
41
+ awful,0.012715496122837067,hate,0.012715496122837067
42
+ ashamed,-0.012626993469893932,non-hate,0.012626993469893932
43
+ ive,0.012543770484626293,hate,0.012543770484626293
44
+ gand,0.012430441565811634,hate,0.012430441565811634
45
+ wing,0.01240457221865654,hate,0.01240457221865654
46
+ absolutely,0.012251339852809906,hate,0.012251339852809906
47
+ easily,-0.012238632887601852,non-hate,0.012238632887601852
48
+ ancestral,-0.011794610880315304,non-hate,0.011794610880315304
49
+ bjp,0.011773284524679184,hate,0.011773284524679184
50
+ lete,0.011766272597014904,hate,0.011766272597014904
51
+ ace,0.01174088753759861,hate,0.01174088753759861
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_full.png ADDED

Git LFS Details

  • SHA256: 4649b6a07c3995ef2c211c44fa91c298374540070cc8b12c2825bddd1750d44d
  • Pointer size: 131 Bytes
  • Size of remote file: 137 kB
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_hindi.csv ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ word,mean_shap,direction,abs_shap
2
+ जीतेगा,-0.007239299826323986,non-hate,0.007239299826323986
3
+ घोंटने,-0.004180442541837692,non-hate,0.004180442541837692
4
+ जिहादी,-0.003943843767046928,non-hate,0.003943843767046928
5
+ आपत्तिजनक,-0.0038822039496153593,non-hate,0.0038822039496153593
6
+ वादा,0.0033049401827156544,hate,0.0033049401827156544
7
+ वैज्ञानिकों,0.003294713096693158,hate,0.003294713096693158
8
+ ऐ,0.0032312911935150623,hate,0.0032312911935150623
9
+ उतारा,0.0031968937255442142,hate,0.0031968937255442142
10
+ गला,0.003006579587236047,hate,0.003006579587236047
11
+ बेवक़ूफ़,0.002906812820583582,hate,0.002906812820583582
12
+ पत्रकारिता,0.0027609646786004305,hate,0.0027609646786004305
13
+ रद्दीके,0.0026735278079286218,hate,0.0026735278079286218
14
+ शहरों,0.002631198847666383,hate,0.002631198847666383
15
+ जब्त,0.002548573538661003,hate,0.002548573538661003
16
+ बेहोश,0.0025251752231270075,hate,0.0025251752231270075
17
+ भाव,0.002492323750630021,hate,0.002492323750630021
18
+ टुडे,0.0024582596961408854,hate,0.0024582596961408854
19
+ चमचो,-0.002437782706692815,non-hate,0.002437782706692815
20
+ मुश्किलें,0.002396735828369856,hate,0.002396735828369856
21
+ वर्षों,0.002379495883360505,hate,0.002379495883360505
22
+ हालांकि,-0.0023559594992548227,non-hate,0.0023559594992548227
23
+ लागत,0.0023375283926725388,hate,0.0023375283926725388
24
+ सलाम,0.002286830684170127,hate,0.002286830684170127
25
+ ग्राउंड,0.002279318403452635,hate,0.002279318403452635
26
+ वर्तमान,0.0022609676234424114,hate,0.0022609676234424114
27
+ भागे,-0.0022224474232643843,non-hate,0.0022224474232643843
28
+ दौड़ेगी,-0.002178625902161002,non-hate,0.002178625902161002
29
+ विभिन्न,0.0021422391291707754,hate,0.0021422391291707754
30
+ लाठीडंडे,-0.0020988776814192533,non-hate,0.0020988776814192533
31
+ भागवत,-0.002050387905910611,non-hate,0.002050387905910611
32
+ पार,0.0020433420886547538,hate,0.0020433420886547538
33
+ बुर,0.002026310656219721,hate,0.002026310656219721
34
+ तमाशा,0.0020122036803513765,hate,0.0020122036803513765
35
+ सजा,0.0019943982360928203,hate,0.0019943982360928203
36
+ आदित्य,0.0019323243759572506,hate,0.0019323243759572506
37
+ कहे,0.0018306594574823976,hate,0.0018306594574823976
38
+ बबाकस,0.0018216012977063656,hate,0.0018216012977063656
39
+ चेंज,0.0018008995102718472,hate,0.0018008995102718472
40
+ रेपिस्ट,-0.0017585812602192163,non-hate,0.0017585812602192163
41
+ गले,0.0017552308272570372,hate,0.0017552308272570372
42
+ वाणिज्य,0.0017530020559206605,hate,0.0017530020559206605
43
+ बयान,0.001748441020026803,hate,0.001748441020026803
44
+ और,0.0017154300702309979,hate,0.0017154300702309979
45
+ ज़िंदगी,0.0016978256171569228,hate,0.0016978256171569228
46
+ सपा,0.001689926371909678,hate,0.001689926371909678
47
+ उज्ज्वल,0.0016891625709831715,hate,0.0016891625709831715
48
+ बढ़कर,0.001684919698163867,hate,0.001684919698163867
49
+ सैलरी,0.0016782438615337014,hate,0.0016782438615337014
50
+ सालाना,0.0016701605636626482,hate,0.0016701605636626482
51
+ अलावा,0.0016669516408001073,hate,0.0016669516408001073
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_hindi.png ADDED
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_hinglish.csv ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ word,mean_shap,direction,abs_shap
2
+ arey,0.045903529971838,hate,0.045903529971838
3
+ bahir,0.04093165323138237,hate,0.04093165323138237
4
+ punish,0.03960862010717392,hate,0.03960862010717392
5
+ papa,0.038925547152757645,hate,0.038925547152757645
6
+ interior,0.03734187036752701,hate,0.03734187036752701
7
+ race,0.03409697115421295,hate,0.03409697115421295
8
+ chori,0.033206719905138016,hate,0.033206719905138016
9
+ online,-0.02929110825061798,non-hate,0.02929110825061798
10
+ kren,0.02906891517341137,hate,0.02906891517341137
11
+ choro,0.02657279558479786,hate,0.02657279558479786
12
+ member,-0.026523131877183914,non-hate,0.026523131877183914
13
+ aad,0.026521164923906326,hate,0.026521164923906326
14
+ highlight,0.025127805769443512,hate,0.025127805769443512
15
+ bout,0.025043504312634468,hate,0.025043504312634468
16
+ chalte,0.023972313851118088,hate,0.023972313851118088
17
+ abduction,0.023200901225209236,hate,0.023200901225209236
18
+ mam,-0.02300681360065937,non-hate,0.02300681360065937
19
+ messages,-0.022140955552458763,non-hate,0.022140955552458763
20
+ laya,0.02126455120742321,hate,0.02126455120742321
21
+ srk,0.020947826730359036,hate,0.020947826730359036
22
+ asha,-0.02039911597967148,non-hate,0.02039911597967148
23
+ altaf,0.01923272293061018,hate,0.01923272293061018
24
+ boss,-0.01831447333097458,non-hate,0.01831447333097458
25
+ 2018,0.017717858776450157,hate,0.017717858776450157
26
+ etna,-0.017587222158908844,non-hate,0.017587222158908844
27
+ geo,0.01754508726298809,hate,0.01754508726298809
28
+ post,-0.016837802055912714,non-hate,0.016837802055912714
29
+ sapna,0.016813437920063734,hate,0.016813437920063734
30
+ mint,-0.015777967870235443,non-hate,0.015777967870235443
31
+ bech,-0.015203659422695637,non-hate,0.015203659422695637
32
+ condemn,0.014873333275318146,hate,0.014873333275318146
33
+ she,0.01479670312255621,hate,0.01479670312255621
34
+ dehli,-0.014155546203255653,non-hate,0.014155546203255653
35
+ bangladeshi,0.01362423226237297,hate,0.01362423226237297
36
+ penis,-0.013533218763768673,non-hate,0.013533218763768673
37
+ dont,-0.01309139747172594,non-hate,0.01309139747172594
38
+ banana,0.012709609232842922,hate,0.012709609232842922
39
+ kah,0.012406427413225174,hate,0.012406427413225174
40
+ sar,-0.012206245155539364,non-hate,0.012206245155539364
41
+ deke,-0.012147174216806889,non-hate,0.012147174216806889
42
+ bin,-0.012057552114129066,non-hate,0.012057552114129066
43
+ ar,-0.011831492185592651,non-hate,0.011831492185592651
44
+ your,-0.011781544308178127,non-hate,0.011781544308178127
45
+ pr,0.011247894560386027,hate,0.011247894560386027
46
+ prediction,-0.011225917376577854,non-hate,0.011225917376577854
47
+ raj,-0.011192606762051582,non-hate,0.011192606762051582
48
+ rajya,-0.010959833860397339,non-hate,0.010959833860397339
49
+ ak,0.010884546441957355,hate,0.010884546441957355
50
+ wohi,-0.010823655873537064,non-hate,0.010823655873537064
51
+ 72,-0.010761625715531409,non-hate,0.010761625715531409
output_v2/shap/v2/hinglish_to_hindi_to_english_v2/shap_topwords_hinglish.png ADDED

Git LFS Details

  • SHA256: 3f2d0269fabe56ccb3a1c1aca4838eb62baac278c2829c0873741db96a4d117c
  • Pointer size: 131 Bytes
  • Size of remote file: 126 kB