PuxAI commited on
Commit
057d132
·
verified ·
1 Parent(s): 60b46fa

Upload folder using huggingface_hub

Browse files
open-pii-masking-500k-ai4privacy/evaluations/bert_plus_crf/eval_summary.json CHANGED
@@ -9,35 +9,35 @@
9
  999
10
  ],
11
  "max_samples_per_seed": 1000,
12
- "avg_precision": 0.9664,
13
- "avg_recall": 0.9673,
14
- "avg_f1": 0.9663,
15
  "per_seed": {
16
  "42": {
17
- "precision": 0.975,
18
- "recall": 0.9736,
19
- "f1": 0.9737
20
  },
21
  "123": {
22
- "precision": 0.965,
23
- "recall": 0.9649,
24
- "f1": 0.9644
25
  },
26
  "456": {
27
- "precision": 0.9637,
28
- "recall": 0.9645,
29
- "f1": 0.9633
30
  },
31
  "789": {
32
- "precision": 0.9665,
33
- "recall": 0.9648,
34
- "f1": 0.965
35
  },
36
  "999": {
37
- "precision": 0.9621,
38
- "recall": 0.9689,
39
- "f1": 0.9653
40
  }
41
  },
42
- "timestamp": "2026-04-05T07:04:30.955187"
43
  }
 
9
  999
10
  ],
11
  "max_samples_per_seed": 1000,
12
+ "avg_precision": 0.9675,
13
+ "avg_recall": 0.9721,
14
+ "avg_f1": 0.9694,
15
  "per_seed": {
16
  "42": {
17
+ "precision": 0.9752,
18
+ "recall": 0.9765,
19
+ "f1": 0.9753
20
  },
21
  "123": {
22
+ "precision": 0.9648,
23
+ "recall": 0.9695,
24
+ "f1": 0.9666
25
  },
26
  "456": {
27
+ "precision": 0.9633,
28
+ "recall": 0.9697,
29
+ "f1": 0.9661
30
  },
31
  "789": {
32
+ "precision": 0.9683,
33
+ "recall": 0.9709,
34
+ "f1": 0.9691
35
  },
36
  "999": {
37
+ "precision": 0.966,
38
+ "recall": 0.974,
39
+ "f1": 0.9699
40
  }
41
  },
42
+ "timestamp": "2026-04-06T05:06:52.454239"
43
  }
open-pii-masking-500k-ai4privacy/evaluations/bert_plus_crf/seed_123_predictions.json CHANGED
@@ -417,7 +417,7 @@
417
  "value": "Sein"
418
  },
419
  {
420
- "tag": "IDCARDNUM",
421
  "start": 42,
422
  "end": 52,
423
  "value": "6567725252"
@@ -1586,8 +1586,14 @@
1586
  {
1587
  "tag": "GIVENNAME",
1588
  "start": 8,
 
 
 
 
 
 
1589
  "end": 20,
1590
- "value": "Alicja Kuthy"
1591
  }
1592
  ]
1593
  },
@@ -1642,14 +1648,14 @@
1642
  {
1643
  "tag": "GIVENNAME",
1644
  "start": 55,
1645
- "end": 59,
1646
- "value": "Noor"
1647
  },
1648
  {
1649
  "tag": "SURNAME",
1650
- "start": 60,
1651
  "end": 83,
1652
- "value": "Moosa Puetate Kudrynska"
1653
  }
1654
  ]
1655
  },
@@ -2264,14 +2270,14 @@
2264
  {
2265
  "tag": "GIVENNAME",
2266
  "start": 27,
2267
- "end": 35,
2268
- "value": "Boguslaw"
2269
  },
2270
  {
2271
  "tag": "SURNAME",
2272
- "start": 36,
2273
  "end": 45,
2274
- "value": "Hase Küng"
2275
  }
2276
  ]
2277
  },
@@ -2903,8 +2909,14 @@
2903
  {
2904
  "tag": "GIVENNAME",
2905
  "start": 51,
 
 
 
 
 
 
2906
  "end": 68,
2907
- "value": "Riyo Uthayasangar"
2908
  },
2909
  {
2910
  "tag": "IDCARDNUM",
@@ -3347,7 +3359,7 @@
3347
  ],
3348
  "predictions": [
3349
  {
3350
- "tag": "GIVENNAME",
3351
  "start": 0,
3352
  "end": 6,
3353
  "value": "Nawfel"
@@ -3814,7 +3826,7 @@
3814
  "value": "Vincy Zoya"
3815
  },
3816
  {
3817
- "tag": "GIVENNAME",
3818
  "start": 26,
3819
  "end": 33,
3820
  "value": "Gençaga"
@@ -3985,7 +3997,7 @@
3985
  "value": "Yannacopoulos Aygül Talevski"
3986
  },
3987
  {
3988
- "tag": "GENDER",
3989
  "start": 59,
3990
  "end": 65,
3991
  "value": "Female"
@@ -4012,14 +4024,8 @@
4012
  {
4013
  "tag": "GIVENNAME",
4014
  "start": 76,
4015
- "end": 82,
4016
- "value": "Cédrik"
4017
- },
4018
- {
4019
- "tag": "SURNAME",
4020
- "start": 83,
4021
  "end": 89,
4022
- "value": "Antani"
4023
  }
4024
  ]
4025
  },
@@ -4506,14 +4512,14 @@
4506
  {
4507
  "tag": "GIVENNAME",
4508
  "start": 76,
4509
- "end": 81,
4510
- "value": "Fayad"
4511
  },
4512
  {
4513
  "tag": "SURNAME",
4514
- "start": 82,
4515
  "end": 106,
4516
- "value": "Cresce Riediger Vidueira"
4517
  }
4518
  ]
4519
  },
@@ -4704,8 +4710,14 @@
4704
  {
4705
  "tag": "GIVENNAME",
4706
  "start": 20,
 
 
 
 
 
 
4707
  "end": 34,
4708
- "value": "Irian Milleron"
4709
  }
4710
  ]
4711
  },
@@ -5185,10 +5197,16 @@
5185
  ],
5186
  "predictions": [
5187
  {
5188
- "tag": "GIVENNAME",
5189
  "start": 88,
 
 
 
 
 
 
5190
  "end": 99,
5191
- "value": "Reisel Elfe"
5192
  },
5193
  {
5194
  "tag": "SURNAME",
@@ -6315,8 +6333,14 @@
6315
  {
6316
  "tag": "GIVENNAME",
6317
  "start": 0,
 
 
 
 
 
 
6318
  "end": 11,
6319
- "value": "Raoni Nicol"
6320
  },
6321
  {
6322
  "tag": "ZIPCODE",
@@ -6433,8 +6457,14 @@
6433
  {
6434
  "tag": "GIVENNAME",
6435
  "start": 33,
 
 
 
 
 
 
6436
  "end": 46,
6437
- "value": "Aldana Ursino"
6438
  },
6439
  {
6440
  "tag": "GIVENNAME",
@@ -7266,8 +7296,14 @@
7266
  {
7267
  "tag": "GIVENNAME",
7268
  "start": 0,
 
 
 
 
 
 
7269
  "end": 14,
7270
- "value": "Georgius Eyyup"
7271
  }
7272
  ]
7273
  },
@@ -8362,8 +8398,14 @@
8362
  {
8363
  "tag": "GIVENNAME",
8364
  "start": 0,
 
 
 
 
 
 
8365
  "end": 12,
8366
- "value": "Tamal Liburn"
8367
  },
8368
  {
8369
  "tag": "AGE",
@@ -8459,7 +8501,7 @@
8459
  "value": "Z37F0883L"
8460
  },
8461
  {
8462
- "tag": "GIVENNAME",
8463
  "start": 18,
8464
  "end": 26,
8465
  "value": "Scairato"
@@ -8484,7 +8526,7 @@
8484
  ],
8485
  "predictions": [
8486
  {
8487
- "tag": "GENDER",
8488
  "start": 0,
8489
  "end": 7,
8490
  "value": "Femmina"
@@ -8770,8 +8812,14 @@
8770
  {
8771
  "tag": "SURNAME",
8772
  "start": 13,
 
 
 
 
 
 
8773
  "end": 32,
8774
- "value": "Jääskelä Mohibullah"
8775
  }
8776
  ]
8777
  },
@@ -11175,7 +11223,7 @@
11175
  ],
11176
  "predictions": [
11177
  {
11178
- "tag": "GIVENNAME",
11179
  "start": 30,
11180
  "end": 37,
11181
  "value": "Duglore"
@@ -11577,8 +11625,14 @@
11577
  {
11578
  "tag": "GIVENNAME",
11579
  "start": 0,
 
 
 
 
 
 
11580
  "end": 13,
11581
- "value": "Durmish Ruini"
11582
  },
11583
  {
11584
  "tag": "EMAIL",
@@ -15253,8 +15307,14 @@
15253
  {
15254
  "tag": "GIVENNAME",
15255
  "start": 37,
 
 
 
 
 
 
15256
  "end": 53,
15257
- "value": "Chengming Manech"
15258
  }
15259
  ]
15260
  },
@@ -15581,8 +15641,14 @@
15581
  {
15582
  "tag": "GIVENNAME",
15583
  "start": 0,
 
 
 
 
 
 
15584
  "end": 12,
15585
- "value": "Kaba Misiuda"
15586
  },
15587
  {
15588
  "tag": "TITLE",
@@ -16526,14 +16592,8 @@
16526
  {
16527
  "tag": "GIVENNAME",
16528
  "start": 83,
16529
- "end": 92,
16530
- "value": "Magdaline"
16531
- },
16532
- {
16533
- "tag": "SURNAME",
16534
- "start": 93,
16535
  "end": 99,
16536
- "value": "Tanaka"
16537
  }
16538
  ]
16539
  },
@@ -17352,7 +17412,7 @@
17352
  ],
17353
  "predictions": [
17354
  {
17355
- "tag": "SEX",
17356
  "start": 34,
17357
  "end": 41,
17358
  "value": "Femmina"
@@ -18140,14 +18200,8 @@
18140
  {
18141
  "tag": "SURNAME",
18142
  "start": 0,
18143
- "end": 12,
18144
- "value": "Sortini Mary"
18145
- },
18146
- {
18147
- "tag": "GIVENNAME",
18148
- "start": 12,
18149
  "end": 20,
18150
- "value": "-Dauphin"
18151
  },
18152
  {
18153
  "tag": "CITY",
@@ -18455,8 +18509,14 @@
18455
  {
18456
  "tag": "GIVENNAME",
18457
  "start": 36,
 
 
 
 
 
 
18458
  "end": 50,
18459
- "value": "Ofelya Nowosad"
18460
  },
18461
  {
18462
  "tag": "TELEPHONENUM",
@@ -18634,8 +18694,14 @@
18634
  {
18635
  "tag": "GIVENNAME",
18636
  "start": 28,
 
 
 
 
 
 
18637
  "end": 42,
18638
- "value": "Franci Uriarte"
18639
  }
18640
  ]
18641
  },
@@ -19278,7 +19344,7 @@
19278
  "value": "022915934962"
19279
  },
19280
  {
19281
- "tag": "ZIPCODE",
19282
  "start": 65,
19283
  "end": 73,
19284
  "value": "00849505"
@@ -19528,8 +19594,14 @@
19528
  {
19529
  "tag": "GIVENNAME",
19530
  "start": 38,
 
 
 
 
 
 
19531
  "end": 52,
19532
- "value": "Bizuayehu Geni"
19533
  },
19534
  {
19535
  "tag": "CITY",
@@ -19685,7 +19757,7 @@
19685
  "value": "Rijpwetering"
19686
  },
19687
  {
19688
- "tag": "SURNAME",
19689
  "start": 49,
19690
  "end": 58,
19691
  "value": "Kochurani"
@@ -20354,8 +20426,14 @@
20354
  {
20355
  "tag": "GIVENNAME",
20356
  "start": 74,
 
 
 
 
 
 
20357
  "end": 94,
20358
- "value": "Tharshanaa Mohammady"
20359
  },
20360
  {
20361
  "tag": "AGE",
@@ -21472,7 +21550,7 @@
21472
  "value": "Siew"
21473
  },
21474
  {
21475
- "tag": "DRIVERLICENSENUM",
21476
  "start": 148,
21477
  "end": 159,
21478
  "value": "10500634229"
@@ -23661,9 +23739,9 @@
23661
  "predictions": [
23662
  {
23663
  "tag": "STREET",
23664
- "start": 107,
23665
  "end": 116,
23666
- "value": "Pestarena"
23667
  },
23668
  {
23669
  "tag": "BUILDINGNUM",
@@ -23999,7 +24077,7 @@
23999
  ],
24000
  "predictions": [
24001
  {
24002
- "tag": "SURNAME",
24003
  "start": 33,
24004
  "end": 48,
24005
  "value": "Glanville Aasar"
@@ -24751,7 +24829,7 @@
24751
  "value": "Robbie"
24752
  },
24753
  {
24754
- "tag": "GIVENNAME",
24755
  "start": 26,
24756
  "end": 34,
24757
  "value": "Hanschke"
@@ -24844,7 +24922,7 @@
24844
  "value": "Sasebes Sumner"
24845
  },
24846
  {
24847
- "tag": "IDCARDNUM",
24848
  "start": 124,
24849
  "end": 133,
24850
  "value": "644256382"
@@ -25058,7 +25136,7 @@
25058
  "value": "Aleksandrs Zaim"
25059
  },
25060
  {
25061
- "tag": "GENDER",
25062
  "start": 44,
25063
  "end": 50,
25064
  "value": "Female"
@@ -25336,7 +25414,7 @@
25336
  ],
25337
  "predictions": [
25338
  {
25339
- "tag": "CITY",
25340
  "start": 45,
25341
  "end": 51,
25342
  "value": "Vienna"
@@ -26333,7 +26411,7 @@
26333
  "value": "Segantin"
26334
  },
26335
  {
26336
- "tag": "ZIPCODE",
26337
  "start": 68,
26338
  "end": 72,
26339
  "value": "3120"
@@ -27616,10 +27694,16 @@
27616
  ],
27617
  "predictions": [
27618
  {
27619
- "tag": "SURNAME",
27620
  "start": 10,
 
 
 
 
 
 
27621
  "end": 32,
27622
- "value": "Kllaus Trettin Desigis"
27623
  },
27624
  {
27625
  "tag": "IDCARDNUM",
@@ -27690,7 +27774,7 @@
27690
  "value": "Lemlem"
27691
  },
27692
  {
27693
- "tag": "SURNAME",
27694
  "start": 45,
27695
  "end": 59,
27696
  "value": "Gastón Mikhael"
@@ -28084,14 +28168,14 @@
28084
  {
28085
  "tag": "GIVENNAME",
28086
  "start": 37,
28087
- "end": 43,
28088
- "value": "Beibei"
28089
  },
28090
  {
28091
  "tag": "SURNAME",
28092
- "start": 44,
28093
  "end": 63,
28094
- "value": "Muthukumaru Leitold"
28095
  },
28096
  {
28097
  "tag": "TELEPHONENUM",
@@ -29177,12 +29261,6 @@
29177
  "start": 12,
29178
  "end": 18,
29179
  "value": "Geremy"
29180
- },
29181
- {
29182
- "tag": "ZIPCODE",
29183
- "start": 49,
29184
- "end": 54,
29185
- "value": "120KB"
29186
  }
29187
  ]
29188
  },
@@ -29409,14 +29487,14 @@
29409
  {
29410
  "tag": "GIVENNAME",
29411
  "start": 48,
29412
- "end": 60,
29413
- "value": "Saban Falcon"
29414
  },
29415
  {
29416
  "tag": "SURNAME",
29417
- "start": 61,
29418
  "end": 70,
29419
- "value": "Bernacchi"
29420
  }
29421
  ]
29422
  },
@@ -29687,14 +29765,8 @@
29687
  {
29688
  "tag": "GIVENNAME",
29689
  "start": 0,
29690
- "end": 9,
29691
- "value": "Anunciata"
29692
- },
29693
- {
29694
- "tag": "SURNAME",
29695
- "start": 10,
29696
  "end": 15,
29697
- "value": "Rekik"
29698
  },
29699
  {
29700
  "tag": "GIVENNAME",
@@ -29858,7 +29930,7 @@
29858
  "value": "0141 15-327-4279"
29859
  },
29860
  {
29861
- "tag": "GIVENNAME",
29862
  "start": 60,
29863
  "end": 66,
29864
  "value": "Mazolo"
@@ -30046,6 +30118,12 @@
30046
  "start": 90,
30047
  "end": 102,
30048
  "value": "27 July 1949"
 
 
 
 
 
 
30049
  }
30050
  ]
30051
  },
@@ -30067,7 +30145,7 @@
30067
  ],
30068
  "predictions": [
30069
  {
30070
- "tag": "SEX",
30071
  "start": 12,
30072
  "end": 16,
30073
  "value": "Male"
@@ -31030,7 +31108,7 @@
31030
  "value": "Djordjina"
31031
  },
31032
  {
31033
- "tag": "SEX",
31034
  "start": 73,
31035
  "end": 79,
31036
  "value": "Female"
@@ -31066,12 +31144,6 @@
31066
  "end": 15,
31067
  "value": "Nsrin Mirëlinda"
31068
  },
31069
- {
31070
- "tag": "SURNAME",
31071
- "start": 16,
31072
- "end": 21,
31073
- "value": "वर्मा"
31074
- },
31075
  {
31076
  "tag": "AGE",
31077
  "start": 42,
@@ -32986,14 +33058,14 @@
32986
  {
32987
  "tag": "GIVENNAME",
32988
  "start": 21,
32989
- "end": 34,
32990
- "value": "Imijanka Avul"
32991
  },
32992
  {
32993
  "tag": "SURNAME",
32994
- "start": 35,
32995
  "end": 40,
32996
- "value": "Beggs"
32997
  },
32998
  {
32999
  "tag": "DATE",
@@ -33104,14 +33176,8 @@
33104
  {
33105
  "tag": "GIVENNAME",
33106
  "start": 52,
33107
- "end": 58,
33108
- "value": "Tinley"
33109
- },
33110
- {
33111
- "tag": "SURNAME",
33112
- "start": 59,
33113
  "end": 63,
33114
- "value": "Osni"
33115
  },
33116
  {
33117
  "tag": "AGE",
@@ -33501,7 +33567,7 @@
33501
  ],
33502
  "predictions": [
33503
  {
33504
- "tag": "GIVENNAME",
33505
  "start": 95,
33506
  "end": 101,
33507
  "value": "Gervas"
@@ -34268,8 +34334,14 @@
34268
  {
34269
  "tag": "GIVENNAME",
34270
  "start": 0,
 
 
 
 
 
 
34271
  "end": 14,
34272
- "value": "Warunya Layali"
34273
  }
34274
  ]
34275
  },
@@ -35340,7 +35412,7 @@
35340
  "value": "Chil"
35341
  },
35342
  {
35343
- "tag": "GIVENNAME",
35344
  "start": 32,
35345
  "end": 36,
35346
  "value": "Stan"
@@ -35421,10 +35493,16 @@
35421
  ],
35422
  "predictions": [
35423
  {
35424
- "tag": "GIVENNAME",
35425
  "start": 63,
 
 
 
 
 
 
35426
  "end": 85,
35427
- "value": "General Plutarco Elías"
35428
  },
35429
  {
35430
  "tag": "SURNAME",
 
417
  "value": "Sein"
418
  },
419
  {
420
+ "tag": "SOCIALNUM",
421
  "start": 42,
422
  "end": 52,
423
  "value": "6567725252"
 
1586
  {
1587
  "tag": "GIVENNAME",
1588
  "start": 8,
1589
+ "end": 14,
1590
+ "value": "Alicja"
1591
+ },
1592
+ {
1593
+ "tag": "SURNAME",
1594
+ "start": 15,
1595
  "end": 20,
1596
+ "value": "Kuthy"
1597
  }
1598
  ]
1599
  },
 
1648
  {
1649
  "tag": "GIVENNAME",
1650
  "start": 55,
1651
+ "end": 65,
1652
+ "value": "Noor Moosa"
1653
  },
1654
  {
1655
  "tag": "SURNAME",
1656
+ "start": 66,
1657
  "end": 83,
1658
+ "value": "Puetate Kudrynska"
1659
  }
1660
  ]
1661
  },
 
2270
  {
2271
  "tag": "GIVENNAME",
2272
  "start": 27,
2273
+ "end": 40,
2274
+ "value": "Boguslaw Hase"
2275
  },
2276
  {
2277
  "tag": "SURNAME",
2278
+ "start": 41,
2279
  "end": 45,
2280
+ "value": "Küng"
2281
  }
2282
  ]
2283
  },
 
2909
  {
2910
  "tag": "GIVENNAME",
2911
  "start": 51,
2912
+ "end": 55,
2913
+ "value": "Riyo"
2914
+ },
2915
+ {
2916
+ "tag": "SURNAME",
2917
+ "start": 56,
2918
  "end": 68,
2919
+ "value": "Uthayasangar"
2920
  },
2921
  {
2922
  "tag": "IDCARDNUM",
 
3359
  ],
3360
  "predictions": [
3361
  {
3362
+ "tag": "SURNAME",
3363
  "start": 0,
3364
  "end": 6,
3365
  "value": "Nawfel"
 
3826
  "value": "Vincy Zoya"
3827
  },
3828
  {
3829
+ "tag": "SURNAME",
3830
  "start": 26,
3831
  "end": 33,
3832
  "value": "Gençaga"
 
3997
  "value": "Yannacopoulos Aygül Talevski"
3998
  },
3999
  {
4000
+ "tag": "SEX",
4001
  "start": 59,
4002
  "end": 65,
4003
  "value": "Female"
 
4024
  {
4025
  "tag": "GIVENNAME",
4026
  "start": 76,
 
 
 
 
 
 
4027
  "end": 89,
4028
+ "value": "Cédrik Antani"
4029
  }
4030
  ]
4031
  },
 
4512
  {
4513
  "tag": "GIVENNAME",
4514
  "start": 76,
4515
+ "end": 88,
4516
+ "value": "Fayad Cresce"
4517
  },
4518
  {
4519
  "tag": "SURNAME",
4520
+ "start": 89,
4521
  "end": 106,
4522
+ "value": "Riediger Vidueira"
4523
  }
4524
  ]
4525
  },
 
4710
  {
4711
  "tag": "GIVENNAME",
4712
  "start": 20,
4713
+ "end": 25,
4714
+ "value": "Irian"
4715
+ },
4716
+ {
4717
+ "tag": "SURNAME",
4718
+ "start": 26,
4719
  "end": 34,
4720
+ "value": "Milleron"
4721
  }
4722
  ]
4723
  },
 
5197
  ],
5198
  "predictions": [
5199
  {
5200
+ "tag": "SURNAME",
5201
  "start": 88,
5202
+ "end": 94,
5203
+ "value": "Reisel"
5204
+ },
5205
+ {
5206
+ "tag": "GIVENNAME",
5207
+ "start": 95,
5208
  "end": 99,
5209
+ "value": "Elfe"
5210
  },
5211
  {
5212
  "tag": "SURNAME",
 
6333
  {
6334
  "tag": "GIVENNAME",
6335
  "start": 0,
6336
+ "end": 5,
6337
+ "value": "Raoni"
6338
+ },
6339
+ {
6340
+ "tag": "SURNAME",
6341
+ "start": 6,
6342
  "end": 11,
6343
+ "value": "Nicol"
6344
  },
6345
  {
6346
  "tag": "ZIPCODE",
 
6457
  {
6458
  "tag": "GIVENNAME",
6459
  "start": 33,
6460
+ "end": 39,
6461
+ "value": "Aldana"
6462
+ },
6463
+ {
6464
+ "tag": "SURNAME",
6465
+ "start": 40,
6466
  "end": 46,
6467
+ "value": "Ursino"
6468
  },
6469
  {
6470
  "tag": "GIVENNAME",
 
7296
  {
7297
  "tag": "GIVENNAME",
7298
  "start": 0,
7299
+ "end": 8,
7300
+ "value": "Georgius"
7301
+ },
7302
+ {
7303
+ "tag": "SURNAME",
7304
+ "start": 9,
7305
  "end": 14,
7306
+ "value": "Eyyup"
7307
  }
7308
  ]
7309
  },
 
8398
  {
8399
  "tag": "GIVENNAME",
8400
  "start": 0,
8401
+ "end": 5,
8402
+ "value": "Tamal"
8403
+ },
8404
+ {
8405
+ "tag": "SURNAME",
8406
+ "start": 6,
8407
  "end": 12,
8408
+ "value": "Liburn"
8409
  },
8410
  {
8411
  "tag": "AGE",
 
8501
  "value": "Z37F0883L"
8502
  },
8503
  {
8504
+ "tag": "SURNAME",
8505
  "start": 18,
8506
  "end": 26,
8507
  "value": "Scairato"
 
8526
  ],
8527
  "predictions": [
8528
  {
8529
+ "tag": "SEX",
8530
  "start": 0,
8531
  "end": 7,
8532
  "value": "Femmina"
 
8812
  {
8813
  "tag": "SURNAME",
8814
  "start": 13,
8815
+ "end": 21,
8816
+ "value": "Jääskelä"
8817
+ },
8818
+ {
8819
+ "tag": "GIVENNAME",
8820
+ "start": 22,
8821
  "end": 32,
8822
+ "value": "Mohibullah"
8823
  }
8824
  ]
8825
  },
 
11223
  ],
11224
  "predictions": [
11225
  {
11226
+ "tag": "SURNAME",
11227
  "start": 30,
11228
  "end": 37,
11229
  "value": "Duglore"
 
11625
  {
11626
  "tag": "GIVENNAME",
11627
  "start": 0,
11628
+ "end": 7,
11629
+ "value": "Durmish"
11630
+ },
11631
+ {
11632
+ "tag": "SURNAME",
11633
+ "start": 8,
11634
  "end": 13,
11635
+ "value": "Ruini"
11636
  },
11637
  {
11638
  "tag": "EMAIL",
 
15307
  {
15308
  "tag": "GIVENNAME",
15309
  "start": 37,
15310
+ "end": 46,
15311
+ "value": "Chengming"
15312
+ },
15313
+ {
15314
+ "tag": "SURNAME",
15315
+ "start": 47,
15316
  "end": 53,
15317
+ "value": "Manech"
15318
  }
15319
  ]
15320
  },
 
15641
  {
15642
  "tag": "GIVENNAME",
15643
  "start": 0,
15644
+ "end": 4,
15645
+ "value": "Kaba"
15646
+ },
15647
+ {
15648
+ "tag": "SURNAME",
15649
+ "start": 5,
15650
  "end": 12,
15651
+ "value": "Misiuda"
15652
  },
15653
  {
15654
  "tag": "TITLE",
 
16592
  {
16593
  "tag": "GIVENNAME",
16594
  "start": 83,
 
 
 
 
 
 
16595
  "end": 99,
16596
+ "value": "Magdaline Tanaka"
16597
  }
16598
  ]
16599
  },
 
17412
  ],
17413
  "predictions": [
17414
  {
17415
+ "tag": "GENDER",
17416
  "start": 34,
17417
  "end": 41,
17418
  "value": "Femmina"
 
18200
  {
18201
  "tag": "SURNAME",
18202
  "start": 0,
 
 
 
 
 
 
18203
  "end": 20,
18204
+ "value": "Sortini Mary-Dauphin"
18205
  },
18206
  {
18207
  "tag": "CITY",
 
18509
  {
18510
  "tag": "GIVENNAME",
18511
  "start": 36,
18512
+ "end": 42,
18513
+ "value": "Ofelya"
18514
+ },
18515
+ {
18516
+ "tag": "SURNAME",
18517
+ "start": 43,
18518
  "end": 50,
18519
+ "value": "Nowosad"
18520
  },
18521
  {
18522
  "tag": "TELEPHONENUM",
 
18694
  {
18695
  "tag": "GIVENNAME",
18696
  "start": 28,
18697
+ "end": 34,
18698
+ "value": "Franci"
18699
+ },
18700
+ {
18701
+ "tag": "SURNAME",
18702
+ "start": 35,
18703
  "end": 42,
18704
+ "value": "Uriarte"
18705
  }
18706
  ]
18707
  },
 
19344
  "value": "022915934962"
19345
  },
19346
  {
19347
+ "tag": "DRIVERLICENSENUM",
19348
  "start": 65,
19349
  "end": 73,
19350
  "value": "00849505"
 
19594
  {
19595
  "tag": "GIVENNAME",
19596
  "start": 38,
19597
+ "end": 47,
19598
+ "value": "Bizuayehu"
19599
+ },
19600
+ {
19601
+ "tag": "SURNAME",
19602
+ "start": 48,
19603
  "end": 52,
19604
+ "value": "Geni"
19605
  },
19606
  {
19607
  "tag": "CITY",
 
19757
  "value": "Rijpwetering"
19758
  },
19759
  {
19760
+ "tag": "GIVENNAME",
19761
  "start": 49,
19762
  "end": 58,
19763
  "value": "Kochurani"
 
20426
  {
20427
  "tag": "GIVENNAME",
20428
  "start": 74,
20429
+ "end": 84,
20430
+ "value": "Tharshanaa"
20431
+ },
20432
+ {
20433
+ "tag": "SURNAME",
20434
+ "start": 85,
20435
  "end": 94,
20436
+ "value": "Mohammady"
20437
  },
20438
  {
20439
  "tag": "AGE",
 
21550
  "value": "Siew"
21551
  },
21552
  {
21553
+ "tag": "TAXNUM",
21554
  "start": 148,
21555
  "end": 159,
21556
  "value": "10500634229"
 
23739
  "predictions": [
23740
  {
23741
  "tag": "STREET",
23742
+ "start": 92,
23743
  "end": 116,
23744
+ "value": "Centro Abitato Pestarena"
23745
  },
23746
  {
23747
  "tag": "BUILDINGNUM",
 
24077
  ],
24078
  "predictions": [
24079
  {
24080
+ "tag": "GIVENNAME",
24081
  "start": 33,
24082
  "end": 48,
24083
  "value": "Glanville Aasar"
 
24829
  "value": "Robbie"
24830
  },
24831
  {
24832
+ "tag": "SURNAME",
24833
  "start": 26,
24834
  "end": 34,
24835
  "value": "Hanschke"
 
24922
  "value": "Sasebes Sumner"
24923
  },
24924
  {
24925
+ "tag": "TAXNUM",
24926
  "start": 124,
24927
  "end": 133,
24928
  "value": "644256382"
 
25136
  "value": "Aleksandrs Zaim"
25137
  },
25138
  {
25139
+ "tag": "SEX",
25140
  "start": 44,
25141
  "end": 50,
25142
  "value": "Female"
 
25414
  ],
25415
  "predictions": [
25416
  {
25417
+ "tag": "GIVENNAME",
25418
  "start": 45,
25419
  "end": 51,
25420
  "value": "Vienna"
 
26411
  "value": "Segantin"
26412
  },
26413
  {
26414
+ "tag": "BUILDINGNUM",
26415
  "start": 68,
26416
  "end": 72,
26417
  "value": "3120"
 
27694
  ],
27695
  "predictions": [
27696
  {
27697
+ "tag": "GIVENNAME",
27698
  "start": 10,
27699
+ "end": 16,
27700
+ "value": "Kllaus"
27701
+ },
27702
+ {
27703
+ "tag": "SURNAME",
27704
+ "start": 17,
27705
  "end": 32,
27706
+ "value": "Trettin Desigis"
27707
  },
27708
  {
27709
  "tag": "IDCARDNUM",
 
27774
  "value": "Lemlem"
27775
  },
27776
  {
27777
+ "tag": "GIVENNAME",
27778
  "start": 45,
27779
  "end": 59,
27780
  "value": "Gastón Mikhael"
 
28168
  {
28169
  "tag": "GIVENNAME",
28170
  "start": 37,
28171
+ "end": 55,
28172
+ "value": "Beibei Muthukumaru"
28173
  },
28174
  {
28175
  "tag": "SURNAME",
28176
+ "start": 56,
28177
  "end": 63,
28178
+ "value": "Leitold"
28179
  },
28180
  {
28181
  "tag": "TELEPHONENUM",
 
29261
  "start": 12,
29262
  "end": 18,
29263
  "value": "Geremy"
 
 
 
 
 
 
29264
  }
29265
  ]
29266
  },
 
29487
  {
29488
  "tag": "GIVENNAME",
29489
  "start": 48,
29490
+ "end": 53,
29491
+ "value": "Saban"
29492
  },
29493
  {
29494
  "tag": "SURNAME",
29495
+ "start": 54,
29496
  "end": 70,
29497
+ "value": "Falcon Bernacchi"
29498
  }
29499
  ]
29500
  },
 
29765
  {
29766
  "tag": "GIVENNAME",
29767
  "start": 0,
 
 
 
 
 
 
29768
  "end": 15,
29769
+ "value": "Anunciata Rekik"
29770
  },
29771
  {
29772
  "tag": "GIVENNAME",
 
29930
  "value": "0141 15-327-4279"
29931
  },
29932
  {
29933
+ "tag": "SURNAME",
29934
  "start": 60,
29935
  "end": 66,
29936
  "value": "Mazolo"
 
30118
  "start": 90,
30119
  "end": 102,
30120
  "value": "27 July 1949"
30121
+ },
30122
+ {
30123
+ "tag": "AGE",
30124
+ "start": 103,
30125
+ "end": 105,
30126
+ "value": "25"
30127
  }
30128
  ]
30129
  },
 
30145
  ],
30146
  "predictions": [
30147
  {
30148
+ "tag": "GENDER",
30149
  "start": 12,
30150
  "end": 16,
30151
  "value": "Male"
 
31108
  "value": "Djordjina"
31109
  },
31110
  {
31111
+ "tag": "GENDER",
31112
  "start": 73,
31113
  "end": 79,
31114
  "value": "Female"
 
31144
  "end": 15,
31145
  "value": "Nsrin Mirëlinda"
31146
  },
 
 
 
 
 
 
31147
  {
31148
  "tag": "AGE",
31149
  "start": 42,
 
33058
  {
33059
  "tag": "GIVENNAME",
33060
  "start": 21,
33061
+ "end": 29,
33062
+ "value": "Imijanka"
33063
  },
33064
  {
33065
  "tag": "SURNAME",
33066
+ "start": 30,
33067
  "end": 40,
33068
+ "value": "Avul Beggs"
33069
  },
33070
  {
33071
  "tag": "DATE",
 
33176
  {
33177
  "tag": "GIVENNAME",
33178
  "start": 52,
 
 
 
 
 
 
33179
  "end": 63,
33180
+ "value": "Tinley Osni"
33181
  },
33182
  {
33183
  "tag": "AGE",
 
33567
  ],
33568
  "predictions": [
33569
  {
33570
+ "tag": "SURNAME",
33571
  "start": 95,
33572
  "end": 101,
33573
  "value": "Gervas"
 
34334
  {
34335
  "tag": "GIVENNAME",
34336
  "start": 0,
34337
+ "end": 7,
34338
+ "value": "Warunya"
34339
+ },
34340
+ {
34341
+ "tag": "SURNAME",
34342
+ "start": 8,
34343
  "end": 14,
34344
+ "value": "Layali"
34345
  }
34346
  ]
34347
  },
 
35412
  "value": "Chil"
35413
  },
35414
  {
35415
+ "tag": "SURNAME",
35416
  "start": 32,
35417
  "end": 36,
35418
  "value": "Stan"
 
35493
  ],
35494
  "predictions": [
35495
  {
35496
+ "tag": "TITLE",
35497
  "start": 63,
35498
+ "end": 70,
35499
+ "value": "General"
35500
+ },
35501
+ {
35502
+ "tag": "GIVENNAME",
35503
+ "start": 71,
35504
  "end": 85,
35505
+ "value": "Plutarco Elías"
35506
  },
35507
  {
35508
  "tag": "SURNAME",
open-pii-masking-500k-ai4privacy/evaluations/bert_plus_crf/seed_42_predictions.json CHANGED
@@ -1911,7 +1911,7 @@
1911
  ],
1912
  "predictions": [
1913
  {
1914
- "tag": "SOCIALNUM",
1915
  "start": 64,
1916
  "end": 74,
1917
  "value": "9870711817"
@@ -3255,8 +3255,14 @@
3255
  {
3256
  "tag": "GIVENNAME",
3257
  "start": 7,
 
 
 
 
 
 
3258
  "end": 16,
3259
- "value": "Suli Goga"
3260
  },
3261
  {
3262
  "tag": "DATE",
@@ -4104,7 +4110,7 @@
4104
  ],
4105
  "predictions": [
4106
  {
4107
- "tag": "CITY",
4108
  "start": 135,
4109
  "end": 141,
4110
  "value": "Weerts"
@@ -5738,7 +5744,7 @@
5738
  "value": "V6UKIKNKB6"
5739
  },
5740
  {
5741
- "tag": "GIVENNAME",
5742
  "start": 114,
5743
  "end": 119,
5744
  "value": "Adolf"
@@ -5961,7 +5967,7 @@
5961
  ],
5962
  "predictions": [
5963
  {
5964
- "tag": "ZIPCODE",
5965
  "start": 40,
5966
  "end": 43,
5967
  "value": "513"
@@ -6478,7 +6484,7 @@
6478
  ],
6479
  "predictions": [
6480
  {
6481
- "tag": "IDCARDNUM",
6482
  "start": 74,
6483
  "end": 84,
6484
  "value": "CZKN7WM2UE"
@@ -6978,8 +6984,14 @@
6978
  {
6979
  "tag": "GIVENNAME",
6980
  "start": 31,
 
 
 
 
 
 
6981
  "end": 41,
6982
- "value": "Alvi Deyan"
6983
  },
6984
  {
6985
  "tag": "CITY",
@@ -7021,8 +7033,14 @@
7021
  {
7022
  "tag": "GIVENNAME",
7023
  "start": 15,
 
 
 
 
 
 
7024
  "end": 24,
7025
- "value": "Haja Haso"
7026
  },
7027
  {
7028
  "tag": "CITY",
@@ -7067,7 +7085,7 @@
7067
  ],
7068
  "predictions": [
7069
  {
7070
- "tag": "IDCARDNUM",
7071
  "start": 59,
7072
  "end": 67,
7073
  "value": "T0663501"
@@ -7654,14 +7672,14 @@
7654
  {
7655
  "tag": "GIVENNAME",
7656
  "start": 101,
7657
- "end": 104,
7658
- "value": "Isa"
7659
  },
7660
  {
7661
  "tag": "SURNAME",
7662
- "start": 105,
7663
  "end": 120,
7664
- "value": "Balu Jupi Viali"
7665
  },
7666
  {
7667
  "tag": "SEX",
@@ -7948,7 +7966,7 @@
7948
  "value": "Floresha"
7949
  },
7950
  {
7951
- "tag": "PASSPORTNUM",
7952
  "start": 76,
7953
  "end": 85,
7954
  "value": "718087585"
@@ -8047,7 +8065,7 @@
8047
  ],
8048
  "predictions": [
8049
  {
8050
- "tag": "GIVENNAME",
8051
  "start": 0,
8052
  "end": 5,
8053
  "value": "Gerny"
@@ -8277,8 +8295,14 @@
8277
  {
8278
  "tag": "GIVENNAME",
8279
  "start": 79,
 
 
 
 
 
 
8280
  "end": 90,
8281
- "value": "Dình Qemail"
8282
  }
8283
  ]
8284
  },
@@ -8891,7 +8915,7 @@
8891
  ],
8892
  "predictions": [
8893
  {
8894
- "tag": "TELEPHONENUM",
8895
  "start": 5,
8896
  "end": 16,
8897
  "value": "06730 38736"
@@ -9127,8 +9151,14 @@
9127
  {
9128
  "tag": "GIVENNAME",
9129
  "start": 135,
 
 
 
 
 
 
9130
  "end": 146,
9131
- "value": "Samyr Ezzat"
9132
  },
9133
  {
9134
  "tag": "TELEPHONENUM",
@@ -9500,7 +9530,7 @@
9500
  ],
9501
  "predictions": [
9502
  {
9503
- "tag": "GIVENNAME",
9504
  "start": 0,
9505
  "end": 9,
9506
  "value": "Laghzaoui"
@@ -9943,12 +9973,6 @@
9943
  }
9944
  ],
9945
  "predictions": [
9946
- {
9947
- "tag": "TITLE",
9948
- "start": 0,
9949
- "end": 9,
9950
- "value": "Assistant"
9951
- },
9952
  {
9953
  "tag": "DATE",
9954
  "start": 88,
@@ -11920,6 +11944,12 @@
11920
  }
11921
  ],
11922
  "predictions": [
 
 
 
 
 
 
11923
  {
11924
  "tag": "CREDITCARDNUMBER",
11925
  "start": 62,
@@ -12043,7 +12073,7 @@
12043
  ],
12044
  "predictions": [
12045
  {
12046
- "tag": "SURNAME",
12047
  "start": 13,
12048
  "end": 22,
12049
  "value": "Gabryella"
@@ -12589,8 +12619,8 @@
12589
  {
12590
  "tag": "IDCARDNUM",
12591
  "start": 62,
12592
- "end": 73,
12593
- "value": "E7354036لوب"
12594
  }
12595
  ]
12596
  },
@@ -13344,7 +13374,7 @@
13344
  "value": "OT1312988"
13345
  },
13346
  {
13347
- "tag": "DRIVERLICENSENUM",
13348
  "start": 29,
13349
  "end": 39,
13350
  "value": "3MBXXLTOXT"
@@ -13744,7 +13774,7 @@
13744
  ],
13745
  "predictions": [
13746
  {
13747
- "tag": "BUILDINGNUM",
13748
  "start": 14,
13749
  "end": 18,
13750
  "value": "1660"
@@ -14100,7 +14130,7 @@
14100
  ],
14101
  "predictions": [
14102
  {
14103
- "tag": "IDCARDNUM",
14104
  "start": 113,
14105
  "end": 122,
14106
  "value": "X5080420G"
@@ -14491,14 +14521,8 @@
14491
  {
14492
  "tag": "ZIPCODE",
14493
  "start": 64,
14494
- "end": 67,
14495
- "value": "714"
14496
- },
14497
- {
14498
- "tag": "BUILDINGNUM",
14499
- "start": 67,
14500
  "end": 70,
14501
- "value": "215"
14502
  }
14503
  ]
14504
  },
@@ -14608,8 +14632,14 @@
14608
  {
14609
  "tag": "GIVENNAME",
14610
  "start": 71,
 
 
 
 
 
 
14611
  "end": 83,
14612
- "value": "Dilda Vitera"
14613
  }
14614
  ]
14615
  },
@@ -15550,22 +15580,10 @@
15550
  "value": "27º dicembre 1959"
15551
  },
15552
  {
15553
- "tag": "GIVENNAME",
15554
- "start": 182,
15555
- "end": 194,
15556
- "value": "Pirakalathan"
15557
- },
15558
- {
15559
- "tag": "GIVENNAME",
15560
  "start": 204,
15561
  "end": 215,
15562
  "value": "Lyrer Nuhii"
15563
- },
15564
- {
15565
- "tag": "SURNAME",
15566
- "start": 216,
15567
- "end": 222,
15568
- "value": "Bricca"
15569
  }
15570
  ]
15571
  },
@@ -15686,7 +15704,7 @@
15686
  "value": "Shafiullah"
15687
  },
15688
  {
15689
- "tag": "IDCARDNUM",
15690
  "start": 110,
15691
  "end": 119,
15692
  "value": "868274180"
@@ -16217,7 +16235,7 @@
16217
  "value": "Prof"
16218
  },
16219
  {
16220
- "tag": "SURNAME",
16221
  "start": 15,
16222
  "end": 20,
16223
  "value": "Neiva"
@@ -17082,7 +17100,7 @@
17082
  ],
17083
  "predictions": [
17084
  {
17085
- "tag": "SEX",
17086
  "start": 0,
17087
  "end": 4,
17088
  "value": "Male"
@@ -17489,14 +17507,14 @@
17489
  {
17490
  "tag": "GIVENNAME",
17491
  "start": 20,
17492
- "end": 26,
17493
- "value": "Aisosa"
17494
  },
17495
  {
17496
  "tag": "SURNAME",
17497
- "start": 27,
17498
  "end": 40,
17499
- "value": "Sadouki Fantl"
17500
  },
17501
  {
17502
  "tag": "DATE",
@@ -17646,6 +17664,12 @@
17646
  "start": 0,
17647
  "end": 5,
17648
  "value": "Hadir"
 
 
 
 
 
 
17649
  }
17650
  ]
17651
  },
@@ -18919,6 +18943,12 @@
18919
  }
18920
  ],
18921
  "predictions": [
 
 
 
 
 
 
18922
  {
18923
  "tag": "STREET",
18924
  "start": 77,
@@ -19932,7 +19962,7 @@
19932
  ],
19933
  "predictions": [
19934
  {
19935
- "tag": "BUILDINGNUM",
19936
  "start": 81,
19937
  "end": 83,
19938
  "value": "54"
@@ -21221,7 +21251,7 @@
21221
  "value": "Mr"
21222
  },
21223
  {
21224
- "tag": "GIVENNAME",
21225
  "start": 111,
21226
  "end": 116,
21227
  "value": "Ganis"
@@ -22109,7 +22139,7 @@
22109
  "value": "Sr"
22110
  },
22111
  {
22112
- "tag": "GIVENNAME",
22113
  "start": 54,
22114
  "end": 61,
22115
  "value": "Humeyra"
@@ -23313,14 +23343,14 @@
23313
  {
23314
  "tag": "GIVENNAME",
23315
  "start": 64,
23316
- "end": 76,
23317
- "value": "Drishya Doca"
23318
  },
23319
  {
23320
  "tag": "SURNAME",
23321
- "start": 77,
23322
  "end": 87,
23323
- "value": "Tchalovski"
23324
  }
23325
  ]
23326
  },
@@ -23663,7 +23693,7 @@
23663
  ],
23664
  "predictions": [
23665
  {
23666
- "tag": "CITY",
23667
  "start": 12,
23668
  "end": 20,
23669
  "value": "Richmond"
@@ -25468,8 +25498,14 @@
25468
  {
25469
  "tag": "GIVENNAME",
25470
  "start": 25,
 
 
 
 
 
 
25471
  "end": 39,
25472
- "value": "Annis Llumnica"
25473
  },
25474
  {
25475
  "tag": "TITLE",
@@ -25946,14 +25982,14 @@
25946
  {
25947
  "tag": "GIVENNAME",
25948
  "start": 0,
25949
- "end": 7,
25950
- "value": "Vaibhav"
25951
  },
25952
  {
25953
  "tag": "SURNAME",
25954
- "start": 8,
25955
  "end": 22,
25956
- "value": "Mascud Firment"
25957
  },
25958
  {
25959
  "tag": "STREET",
@@ -26215,12 +26251,6 @@
26215
  }
26216
  ],
26217
  "predictions": [
26218
- {
26219
- "tag": "TITLE",
26220
- "start": 0,
26221
- "end": 10,
26222
- "value": "Controleer"
26223
- },
26224
  {
26225
  "tag": "GIVENNAME",
26226
  "start": 14,
@@ -26431,7 +26461,7 @@
26431
  "value": "Shejan"
26432
  },
26433
  {
26434
- "tag": "GIVENNAME",
26435
  "start": 75,
26436
  "end": 92,
26437
  "value": "Hirashima Einhaus"
@@ -26697,8 +26727,14 @@
26697
  {
26698
  "tag": "GIVENNAME",
26699
  "start": 11,
 
 
 
 
 
 
26700
  "end": 25,
26701
- "value": "Mehrnaz Sumbul"
26702
  },
26703
  {
26704
  "tag": "CITY",
@@ -27833,10 +27869,16 @@
27833
  "value": "Vollaro Kissack"
27834
  },
27835
  {
27836
- "tag": "STREET",
27837
  "start": 31,
 
 
 
 
 
 
27838
  "end": 53,
27839
- "value": "Lanoraie Chemin Brooks"
27840
  },
27841
  {
27842
  "tag": "BUILDINGNUM",
@@ -28076,8 +28118,14 @@
28076
  {
28077
  "tag": "GIVENNAME",
28078
  "start": 48,
 
 
 
 
 
 
28079
  "end": 64,
28080
- "value": "Jagadeesh Kletus"
28081
  },
28082
  {
28083
  "tag": "CITY",
@@ -28803,6 +28851,12 @@
28803
  "start": 15,
28804
  "end": 27,
28805
  "value": "Montan Lüppe"
 
 
 
 
 
 
28806
  }
28807
  ]
28808
  },
@@ -29014,7 +29068,7 @@
29014
  "value": "33789-34195"
29015
  },
29016
  {
29017
- "tag": "DRIVERLICENSENUM",
29018
  "start": 52,
29019
  "end": 62,
29020
  "value": "3336988621"
@@ -32027,14 +32081,14 @@
32027
  {
32028
  "tag": "GIVENNAME",
32029
  "start": 0,
32030
- "end": 7,
32031
- "value": "M'barek"
32032
  },
32033
  {
32034
  "tag": "SURNAME",
32035
- "start": 8,
32036
  "end": 28,
32037
- "value": "Colins Bettler Mimmo"
32038
  },
32039
  {
32040
  "tag": "TELEPHONENUM",
@@ -32558,14 +32612,14 @@
32558
  {
32559
  "tag": "GIVENNAME",
32560
  "start": 25,
32561
- "end": 30,
32562
- "value": "Yixin"
32563
  },
32564
  {
32565
  "tag": "SURNAME",
32566
- "start": 31,
32567
  "end": 49,
32568
- "value": "Ratnasingam Dotoli"
32569
  }
32570
  ]
32571
  },
@@ -32901,7 +32955,7 @@
32901
  "value": "Sein"
32902
  },
32903
  {
32904
- "tag": "IDCARDNUM",
32905
  "start": 42,
32906
  "end": 52,
32907
  "value": "6567725252"
@@ -33016,14 +33070,14 @@
33016
  {
33017
  "tag": "GIVENNAME",
33018
  "start": 87,
33019
- "end": 103,
33020
- "value": "Ezatollah Tereso"
33021
  },
33022
  {
33023
  "tag": "SURNAME",
33024
- "start": 104,
33025
  "end": 121,
33026
- "value": "Benvenuto Dallari"
33027
  }
33028
  ]
33029
  },
@@ -33365,7 +33419,7 @@
33365
  ],
33366
  "predictions": [
33367
  {
33368
- "tag": "GIVENNAME",
33369
  "start": 24,
33370
  "end": 31,
33371
  "value": "Hamayun"
@@ -34600,14 +34654,14 @@
34600
  {
34601
  "tag": "GIVENNAME",
34602
  "start": 9,
34603
- "end": 15,
34604
- "value": "Cercis"
34605
  },
34606
  {
34607
  "tag": "SURNAME",
34608
- "start": 16,
34609
  "end": 27,
34610
- "value": "Ransi Vasko"
34611
  }
34612
  ]
34613
  },
@@ -35277,12 +35331,6 @@
35277
  "start": 0,
35278
  "end": 4,
35279
  "value": "2828"
35280
- },
35281
- {
35282
- "tag": "GIVENNAME",
35283
- "start": 21,
35284
- "end": 27,
35285
- "value": "Pakete"
35286
  }
35287
  ]
35288
  },
@@ -35392,14 +35440,8 @@
35392
  {
35393
  "tag": "GIVENNAME",
35394
  "start": 16,
35395
- "end": 28,
35396
- "value": "Dan-Cristian"
35397
- },
35398
- {
35399
- "tag": "SURNAME",
35400
- "start": 29,
35401
  "end": 35,
35402
- "value": "Medzid"
35403
  },
35404
  {
35405
  "tag": "BUILDINGNUM",
 
1911
  ],
1912
  "predictions": [
1913
  {
1914
+ "tag": "TAXNUM",
1915
  "start": 64,
1916
  "end": 74,
1917
  "value": "9870711817"
 
3255
  {
3256
  "tag": "GIVENNAME",
3257
  "start": 7,
3258
+ "end": 11,
3259
+ "value": "Suli"
3260
+ },
3261
+ {
3262
+ "tag": "SURNAME",
3263
+ "start": 12,
3264
  "end": 16,
3265
+ "value": "Goga"
3266
  },
3267
  {
3268
  "tag": "DATE",
 
4110
  ],
4111
  "predictions": [
4112
  {
4113
+ "tag": "SURNAME",
4114
  "start": 135,
4115
  "end": 141,
4116
  "value": "Weerts"
 
5744
  "value": "V6UKIKNKB6"
5745
  },
5746
  {
5747
+ "tag": "CITY",
5748
  "start": 114,
5749
  "end": 119,
5750
  "value": "Adolf"
 
5967
  ],
5968
  "predictions": [
5969
  {
5970
+ "tag": "BUILDINGNUM",
5971
  "start": 40,
5972
  "end": 43,
5973
  "value": "513"
 
6484
  ],
6485
  "predictions": [
6486
  {
6487
+ "tag": "DRIVERLICENSENUM",
6488
  "start": 74,
6489
  "end": 84,
6490
  "value": "CZKN7WM2UE"
 
6984
  {
6985
  "tag": "GIVENNAME",
6986
  "start": 31,
6987
+ "end": 35,
6988
+ "value": "Alvi"
6989
+ },
6990
+ {
6991
+ "tag": "SURNAME",
6992
+ "start": 36,
6993
  "end": 41,
6994
+ "value": "Deyan"
6995
  },
6996
  {
6997
  "tag": "CITY",
 
7033
  {
7034
  "tag": "GIVENNAME",
7035
  "start": 15,
7036
+ "end": 19,
7037
+ "value": "Haja"
7038
+ },
7039
+ {
7040
+ "tag": "SURNAME",
7041
+ "start": 20,
7042
  "end": 24,
7043
+ "value": "Haso"
7044
  },
7045
  {
7046
  "tag": "CITY",
 
7085
  ],
7086
  "predictions": [
7087
  {
7088
+ "tag": "PASSPORTNUM",
7089
  "start": 59,
7090
  "end": 67,
7091
  "value": "T0663501"
 
7672
  {
7673
  "tag": "GIVENNAME",
7674
  "start": 101,
7675
+ "end": 109,
7676
+ "value": "Isa Balu"
7677
  },
7678
  {
7679
  "tag": "SURNAME",
7680
+ "start": 110,
7681
  "end": 120,
7682
+ "value": "Jupi Viali"
7683
  },
7684
  {
7685
  "tag": "SEX",
 
7966
  "value": "Floresha"
7967
  },
7968
  {
7969
+ "tag": "SOCIALNUM",
7970
  "start": 76,
7971
  "end": 85,
7972
  "value": "718087585"
 
8065
  ],
8066
  "predictions": [
8067
  {
8068
+ "tag": "SURNAME",
8069
  "start": 0,
8070
  "end": 5,
8071
  "value": "Gerny"
 
8295
  {
8296
  "tag": "GIVENNAME",
8297
  "start": 79,
8298
+ "end": 83,
8299
+ "value": "Dình"
8300
+ },
8301
+ {
8302
+ "tag": "SURNAME",
8303
+ "start": 84,
8304
  "end": 90,
8305
+ "value": "Qemail"
8306
  }
8307
  ]
8308
  },
 
8915
  ],
8916
  "predictions": [
8917
  {
8918
+ "tag": "TAXNUM",
8919
  "start": 5,
8920
  "end": 16,
8921
  "value": "06730 38736"
 
9151
  {
9152
  "tag": "GIVENNAME",
9153
  "start": 135,
9154
+ "end": 140,
9155
+ "value": "Samyr"
9156
+ },
9157
+ {
9158
+ "tag": "SURNAME",
9159
+ "start": 141,
9160
  "end": 146,
9161
+ "value": "Ezzat"
9162
  },
9163
  {
9164
  "tag": "TELEPHONENUM",
 
9530
  ],
9531
  "predictions": [
9532
  {
9533
+ "tag": "SURNAME",
9534
  "start": 0,
9535
  "end": 9,
9536
  "value": "Laghzaoui"
 
9973
  }
9974
  ],
9975
  "predictions": [
 
 
 
 
 
 
9976
  {
9977
  "tag": "DATE",
9978
  "start": 88,
 
11944
  }
11945
  ],
11946
  "predictions": [
11947
+ {
11948
+ "tag": "GIVENNAME",
11949
+ "start": 54,
11950
+ "end": 61,
11951
+ "value": "Janvier"
11952
+ },
11953
  {
11954
  "tag": "CREDITCARDNUMBER",
11955
  "start": 62,
 
12073
  ],
12074
  "predictions": [
12075
  {
12076
+ "tag": "GIVENNAME",
12077
  "start": 13,
12078
  "end": 22,
12079
  "value": "Gabryella"
 
12619
  {
12620
  "tag": "IDCARDNUM",
12621
  "start": 62,
12622
+ "end": 70,
12623
+ "value": "E7354036"
12624
  }
12625
  ]
12626
  },
 
13374
  "value": "OT1312988"
13375
  },
13376
  {
13377
+ "tag": "IDCARDNUM",
13378
  "start": 29,
13379
  "end": 39,
13380
  "value": "3MBXXLTOXT"
 
13774
  ],
13775
  "predictions": [
13776
  {
13777
+ "tag": "ZIPCODE",
13778
  "start": 14,
13779
  "end": 18,
13780
  "value": "1660"
 
14130
  ],
14131
  "predictions": [
14132
  {
14133
+ "tag": "TAXNUM",
14134
  "start": 113,
14135
  "end": 122,
14136
  "value": "X5080420G"
 
14521
  {
14522
  "tag": "ZIPCODE",
14523
  "start": 64,
 
 
 
 
 
 
14524
  "end": 70,
14525
+ "value": "714215"
14526
  }
14527
  ]
14528
  },
 
14632
  {
14633
  "tag": "GIVENNAME",
14634
  "start": 71,
14635
+ "end": 76,
14636
+ "value": "Dilda"
14637
+ },
14638
+ {
14639
+ "tag": "SURNAME",
14640
+ "start": 77,
14641
  "end": 83,
14642
+ "value": "Vitera"
14643
  }
14644
  ]
14645
  },
 
15580
  "value": "27º dicembre 1959"
15581
  },
15582
  {
15583
+ "tag": "SURNAME",
 
 
 
 
 
 
15584
  "start": 204,
15585
  "end": 215,
15586
  "value": "Lyrer Nuhii"
 
 
 
 
 
 
15587
  }
15588
  ]
15589
  },
 
15704
  "value": "Shafiullah"
15705
  },
15706
  {
15707
+ "tag": "TAXNUM",
15708
  "start": 110,
15709
  "end": 119,
15710
  "value": "868274180"
 
16235
  "value": "Prof"
16236
  },
16237
  {
16238
+ "tag": "GIVENNAME",
16239
  "start": 15,
16240
  "end": 20,
16241
  "value": "Neiva"
 
17100
  ],
17101
  "predictions": [
17102
  {
17103
+ "tag": "GENDER",
17104
  "start": 0,
17105
  "end": 4,
17106
  "value": "Male"
 
17507
  {
17508
  "tag": "GIVENNAME",
17509
  "start": 20,
17510
+ "end": 34,
17511
+ "value": "Aisosa Sadouki"
17512
  },
17513
  {
17514
  "tag": "SURNAME",
17515
+ "start": 35,
17516
  "end": 40,
17517
+ "value": "Fantl"
17518
  },
17519
  {
17520
  "tag": "DATE",
 
17664
  "start": 0,
17665
  "end": 5,
17666
  "value": "Hadir"
17667
+ },
17668
+ {
17669
+ "tag": "AGE",
17670
+ "start": 79,
17671
+ "end": 81,
17672
+ "value": "30"
17673
  }
17674
  ]
17675
  },
 
18943
  }
18944
  ],
18945
  "predictions": [
18946
+ {
18947
+ "tag": "SURNAME",
18948
+ "start": 50,
18949
+ "end": 57,
18950
+ "value": "Diriger"
18951
+ },
18952
  {
18953
  "tag": "STREET",
18954
  "start": 77,
 
19962
  ],
19963
  "predictions": [
19964
  {
19965
+ "tag": "AGE",
19966
  "start": 81,
19967
  "end": 83,
19968
  "value": "54"
 
21251
  "value": "Mr"
21252
  },
21253
  {
21254
+ "tag": "SURNAME",
21255
  "start": 111,
21256
  "end": 116,
21257
  "value": "Ganis"
 
22139
  "value": "Sr"
22140
  },
22141
  {
22142
+ "tag": "SURNAME",
22143
  "start": 54,
22144
  "end": 61,
22145
  "value": "Humeyra"
 
23343
  {
23344
  "tag": "GIVENNAME",
23345
  "start": 64,
23346
+ "end": 71,
23347
+ "value": "Drishya"
23348
  },
23349
  {
23350
  "tag": "SURNAME",
23351
+ "start": 72,
23352
  "end": 87,
23353
+ "value": "Doca Tchalovski"
23354
  }
23355
  ]
23356
  },
 
23693
  ],
23694
  "predictions": [
23695
  {
23696
+ "tag": "GIVENNAME",
23697
  "start": 12,
23698
  "end": 20,
23699
  "value": "Richmond"
 
25498
  {
25499
  "tag": "GIVENNAME",
25500
  "start": 25,
25501
+ "end": 30,
25502
+ "value": "Annis"
25503
+ },
25504
+ {
25505
+ "tag": "SURNAME",
25506
+ "start": 31,
25507
  "end": 39,
25508
+ "value": "Llumnica"
25509
  },
25510
  {
25511
  "tag": "TITLE",
 
25982
  {
25983
  "tag": "GIVENNAME",
25984
  "start": 0,
25985
+ "end": 14,
25986
+ "value": "Vaibhav Mascud"
25987
  },
25988
  {
25989
  "tag": "SURNAME",
25990
+ "start": 15,
25991
  "end": 22,
25992
+ "value": "Firment"
25993
  },
25994
  {
25995
  "tag": "STREET",
 
26251
  }
26252
  ],
26253
  "predictions": [
 
 
 
 
 
 
26254
  {
26255
  "tag": "GIVENNAME",
26256
  "start": 14,
 
26461
  "value": "Shejan"
26462
  },
26463
  {
26464
+ "tag": "SURNAME",
26465
  "start": 75,
26466
  "end": 92,
26467
  "value": "Hirashima Einhaus"
 
26727
  {
26728
  "tag": "GIVENNAME",
26729
  "start": 11,
26730
+ "end": 18,
26731
+ "value": "Mehrnaz"
26732
+ },
26733
+ {
26734
+ "tag": "SURNAME",
26735
+ "start": 19,
26736
  "end": 25,
26737
+ "value": "Sumbul"
26738
  },
26739
  {
26740
  "tag": "CITY",
 
27869
  "value": "Vollaro Kissack"
27870
  },
27871
  {
27872
+ "tag": "CITY",
27873
  "start": 31,
27874
+ "end": 39,
27875
+ "value": "Lanoraie"
27876
+ },
27877
+ {
27878
+ "tag": "STREET",
27879
+ "start": 40,
27880
  "end": 53,
27881
+ "value": "Chemin Brooks"
27882
  },
27883
  {
27884
  "tag": "BUILDINGNUM",
 
28118
  {
28119
  "tag": "GIVENNAME",
28120
  "start": 48,
28121
+ "end": 57,
28122
+ "value": "Jagadeesh"
28123
+ },
28124
+ {
28125
+ "tag": "SURNAME",
28126
+ "start": 58,
28127
  "end": 64,
28128
+ "value": "Kletus"
28129
  },
28130
  {
28131
  "tag": "CITY",
 
28851
  "start": 15,
28852
  "end": 27,
28853
  "value": "Montan Lüppe"
28854
+ },
28855
+ {
28856
+ "tag": "BUILDINGNUM",
28857
+ "start": 100,
28858
+ "end": 103,
28859
+ "value": "100"
28860
  }
28861
  ]
28862
  },
 
29068
  "value": "33789-34195"
29069
  },
29070
  {
29071
+ "tag": "SOCIALNUM",
29072
  "start": 52,
29073
  "end": 62,
29074
  "value": "3336988621"
 
32081
  {
32082
  "tag": "GIVENNAME",
32083
  "start": 0,
32084
+ "end": 14,
32085
+ "value": "M'barek Colins"
32086
  },
32087
  {
32088
  "tag": "SURNAME",
32089
+ "start": 15,
32090
  "end": 28,
32091
+ "value": "Bettler Mimmo"
32092
  },
32093
  {
32094
  "tag": "TELEPHONENUM",
 
32612
  {
32613
  "tag": "GIVENNAME",
32614
  "start": 25,
32615
+ "end": 42,
32616
+ "value": "Yixin Ratnasingam"
32617
  },
32618
  {
32619
  "tag": "SURNAME",
32620
+ "start": 43,
32621
  "end": 49,
32622
+ "value": "Dotoli"
32623
  }
32624
  ]
32625
  },
 
32955
  "value": "Sein"
32956
  },
32957
  {
32958
+ "tag": "SOCIALNUM",
32959
  "start": 42,
32960
  "end": 52,
32961
  "value": "6567725252"
 
33070
  {
33071
  "tag": "GIVENNAME",
33072
  "start": 87,
33073
+ "end": 96,
33074
+ "value": "Ezatollah"
33075
  },
33076
  {
33077
  "tag": "SURNAME",
33078
+ "start": 97,
33079
  "end": 121,
33080
+ "value": "Tereso Benvenuto Dallari"
33081
  }
33082
  ]
33083
  },
 
33419
  ],
33420
  "predictions": [
33421
  {
33422
+ "tag": "CITY",
33423
  "start": 24,
33424
  "end": 31,
33425
  "value": "Hamayun"
 
34654
  {
34655
  "tag": "GIVENNAME",
34656
  "start": 9,
34657
+ "end": 21,
34658
+ "value": "Cercis Ransi"
34659
  },
34660
  {
34661
  "tag": "SURNAME",
34662
+ "start": 22,
34663
  "end": 27,
34664
+ "value": "Vasko"
34665
  }
34666
  ]
34667
  },
 
35331
  "start": 0,
35332
  "end": 4,
35333
  "value": "2828"
 
 
 
 
 
 
35334
  }
35335
  ]
35336
  },
 
35440
  {
35441
  "tag": "GIVENNAME",
35442
  "start": 16,
 
 
 
 
 
 
35443
  "end": 35,
35444
+ "value": "Dan-Cristian Medzid"
35445
  },
35446
  {
35447
  "tag": "BUILDINGNUM",
open-pii-masking-500k-ai4privacy/evaluations/bert_plus_crf/seed_456_predictions.json CHANGED
@@ -49,14 +49,8 @@
49
  {
50
  "tag": "GIVENNAME",
51
  "start": 101,
52
- "end": 106,
53
- "value": "Sveya"
54
- },
55
- {
56
- "tag": "SURNAME",
57
- "start": 107,
58
  "end": 113,
59
- "value": "Malado"
60
  }
61
  ]
62
  },
@@ -379,7 +373,7 @@
379
  "value": "Sirikanya"
380
  },
381
  {
382
- "tag": "SEX",
383
  "start": 20,
384
  "end": 28,
385
  "value": "Männlich"
@@ -766,12 +760,6 @@
766
  }
767
  ],
768
  "predictions": [
769
- {
770
- "tag": "GIVENNAME",
771
- "start": 11,
772
- "end": 15,
773
- "value": "Chai"
774
- },
775
  {
776
  "tag": "GIVENNAME",
777
  "start": 36,
@@ -1286,8 +1274,14 @@
1286
  {
1287
  "tag": "GIVENNAME",
1288
  "start": 35,
 
 
 
 
 
 
1289
  "end": 49,
1290
- "value": "Haifeng Almena"
1291
  }
1292
  ]
1293
  },
@@ -2202,7 +2196,7 @@
2202
  ],
2203
  "predictions": [
2204
  {
2205
- "tag": "GIVENNAME",
2206
  "start": 28,
2207
  "end": 45,
2208
  "value": "Lomanto Rupprecht"
@@ -2467,7 +2461,7 @@
2467
  "value": "343383163175337"
2468
  },
2469
  {
2470
- "tag": "DRIVERLICENSENUM",
2471
  "start": 73,
2472
  "end": 83,
2473
  "value": "Q3YEN1MPVF"
@@ -2904,8 +2898,8 @@
2904
  {
2905
  "tag": "SURNAME",
2906
  "start": 42,
2907
- "end": 57,
2908
- "value": "Khatchikian God"
2909
  }
2910
  ]
2911
  },
@@ -3000,7 +2994,7 @@
3000
  "value": "Mister"
3001
  },
3002
  {
3003
- "tag": "GIVENNAME",
3004
  "start": 80,
3005
  "end": 86,
3006
  "value": "Belina"
@@ -3302,7 +3296,7 @@
3302
  "value": "Gardet Bodet"
3303
  },
3304
  {
3305
- "tag": "IDCARDNUM",
3306
  "start": 104,
3307
  "end": 114,
3308
  "value": "6509094045"
@@ -3550,7 +3544,7 @@
3550
  "value": "Sedalia"
3551
  },
3552
  {
3553
- "tag": "CITY",
3554
  "start": 132,
3555
  "end": 139,
3556
  "value": "Valpuri"
@@ -3753,7 +3747,7 @@
3753
  "value": "Flumini"
3754
  },
3755
  {
3756
- "tag": "STREET",
3757
  "start": 73,
3758
  "end": 85,
3759
  "value": "Oeschinensee"
@@ -4996,8 +4990,14 @@
4996
  {
4997
  "tag": "GIVENNAME",
4998
  "start": 0,
 
 
 
 
 
 
4999
  "end": 14,
5000
- "value": "Sugey Lalicata"
5001
  }
5002
  ]
5003
  },
@@ -5272,12 +5272,6 @@
5272
  "start": 0,
5273
  "end": 19,
5274
  "value": "3127052588326222790"
5275
- },
5276
- {
5277
- "tag": "TELEPHONENUM",
5278
- "start": 22,
5279
- "end": 41,
5280
- "value": "1234-4567-8912-3456"
5281
  }
5282
  ]
5283
  },
@@ -7511,8 +7505,14 @@
7511
  {
7512
  "tag": "GIVENNAME",
7513
  "start": 0,
 
 
 
 
 
 
7514
  "end": 17,
7515
- "value": "Maïlyss Omokhuale"
7516
  },
7517
  {
7518
  "tag": "CREDITCARDNUMBER",
@@ -8705,8 +8705,14 @@
8705
  {
8706
  "tag": "GIVENNAME",
8707
  "start": 11,
 
 
 
 
 
 
8708
  "end": 23,
8709
- "value": "Fazela Drori"
8710
  },
8711
  {
8712
  "tag": "EMAIL",
@@ -9879,8 +9885,14 @@
9879
  {
9880
  "tag": "GIVENNAME",
9881
  "start": 8,
 
 
 
 
 
 
9882
  "end": 22,
9883
- "value": "Ravirajah Fung"
9884
  }
9885
  ]
9886
  },
@@ -10206,10 +10218,16 @@
10206
  "value": "Thaddeus Ignatius"
10207
  },
10208
  {
10209
- "tag": "SURNAME",
10210
  "start": 36,
 
 
 
 
 
 
10211
  "end": 50,
10212
- "value": "Arbey Drongdey"
10213
  }
10214
  ]
10215
  },
@@ -10878,7 +10896,7 @@
10878
  "value": "Slodowicz"
10879
  },
10880
  {
10881
- "tag": "IDCARDNUM",
10882
  "start": 53,
10883
  "end": 63,
10884
  "value": "RNSUEEE42V"
@@ -12400,7 +12418,7 @@
12400
  "value": "Boulton Drive"
12401
  },
12402
  {
12403
- "tag": "ZIPCODE",
12404
  "start": 65,
12405
  "end": 70,
12406
  "value": "43860"
@@ -13686,7 +13704,7 @@
13686
  "value": "38722832551847"
13687
  },
13688
  {
13689
- "tag": "SEX",
13690
  "start": 66,
13691
  "end": 73,
13692
  "value": "Femmina"
@@ -14168,9 +14186,9 @@
14168
  "predictions": [
14169
  {
14170
  "tag": "GIVENNAME",
14171
- "start": 0,
14172
  "end": 30,
14173
- "value": "Archer Jamina Mihaela-Loredana"
14174
  },
14175
  {
14176
  "tag": "SURNAME",
@@ -15192,8 +15210,14 @@
15192
  {
15193
  "tag": "GIVENNAME",
15194
  "start": 79,
 
 
 
 
 
 
15195
  "end": 90,
15196
- "value": "Dình Qemail"
15197
  }
15198
  ]
15199
  },
@@ -15482,6 +15506,12 @@
15482
  "start": 79,
15483
  "end": 84,
15484
  "value": "23823"
 
 
 
 
 
 
15485
  }
15486
  ]
15487
  },
@@ -15893,8 +15923,14 @@
15893
  {
15894
  "tag": "GIVENNAME",
15895
  "start": 7,
 
 
 
 
 
 
15896
  "end": 32,
15897
- "value": "Jacques-François Yemaneab"
15898
  },
15899
  {
15900
  "tag": "STREET",
@@ -16097,8 +16133,14 @@
16097
  {
16098
  "tag": "GIVENNAME",
16099
  "start": 101,
 
 
 
 
 
 
16100
  "end": 112,
16101
- "value": "Adorján Syl"
16102
  },
16103
  {
16104
  "tag": "DATE",
@@ -16228,6 +16270,12 @@
16228
  "end": 33,
16229
  "value": "mars/96"
16230
  },
 
 
 
 
 
 
16231
  {
16232
  "tag": "CITY",
16233
  "start": 36,
@@ -17433,8 +17481,14 @@
17433
  {
17434
  "tag": "GIVENNAME",
17435
  "start": 112,
 
 
 
 
 
 
17436
  "end": 127,
17437
- "value": "Manolita Cahide"
17438
  }
17439
  ]
17440
  },
@@ -17477,8 +17531,14 @@
17477
  {
17478
  "tag": "GIVENNAME",
17479
  "start": 40,
 
 
 
 
 
 
17480
  "end": 53,
17481
- "value": "Blend - Macie"
17482
  },
17483
  {
17484
  "tag": "SURNAME",
@@ -18153,8 +18213,14 @@
18153
  {
18154
  "tag": "GIVENNAME",
18155
  "start": 24,
 
 
 
 
 
 
18156
  "end": 34,
18157
- "value": "Anikò Fibi"
18158
  }
18159
  ]
18160
  },
@@ -18739,9 +18805,9 @@
18739
  },
18740
  {
18741
  "tag": "SURNAME",
18742
- "start": 81,
18743
  "end": 91,
18744
- "value": "Bardowicks"
18745
  }
18746
  ]
18747
  },
@@ -18892,7 +18958,7 @@
18892
  ],
18893
  "predictions": [
18894
  {
18895
- "tag": "SURNAME",
18896
  "start": 21,
18897
  "end": 25,
18898
  "value": "Butz"
@@ -20624,14 +20690,14 @@
20624
  {
20625
  "tag": "GIVENNAME",
20626
  "start": 13,
20627
- "end": 29,
20628
- "value": "Joelson Nnaemeka"
20629
  },
20630
  {
20631
  "tag": "SURNAME",
20632
- "start": 30,
20633
  "end": 36,
20634
- "value": "Sutera"
20635
  },
20636
  {
20637
  "tag": "EMAIL",
@@ -21430,7 +21496,7 @@
21430
  ],
21431
  "predictions": [
21432
  {
21433
- "tag": "SEX",
21434
  "start": 38,
21435
  "end": 39,
21436
  "value": "M"
@@ -22054,8 +22120,14 @@
22054
  {
22055
  "tag": "GIVENNAME",
22056
  "start": 6,
 
 
 
 
 
 
22057
  "end": 21,
22058
- "value": "Lavinia Binetou"
22059
  },
22060
  {
22061
  "tag": "GIVENNAME",
@@ -22131,7 +22203,7 @@
22131
  "value": "0691 40765773"
22132
  },
22133
  {
22134
- "tag": "CITY",
22135
  "start": 218,
22136
  "end": 229,
22137
  "value": "Lalithadevi"
@@ -22469,12 +22541,6 @@
22469
  "end": 41,
22470
  "value": "Thuruvan"
22471
  },
22472
- {
22473
- "tag": "SURNAME",
22474
- "start": 42,
22475
- "end": 47,
22476
- "value": "Yacht"
22477
- },
22478
  {
22479
  "tag": "TELEPHONENUM",
22480
  "start": 73,
@@ -22855,14 +22921,8 @@
22855
  {
22856
  "tag": "GIVENNAME",
22857
  "start": 16,
22858
- "end": 20,
22859
- "value": "Maya"
22860
- },
22861
- {
22862
- "tag": "SURNAME",
22863
- "start": 21,
22864
  "end": 27,
22865
- "value": "Burton"
22866
  },
22867
  {
22868
  "tag": "BUILDINGNUM",
@@ -23119,8 +23179,14 @@
23119
  {
23120
  "tag": "GIVENNAME",
23121
  "start": 31,
 
 
 
 
 
 
23122
  "end": 45,
23123
- "value": "Helmuth Tonton"
23124
  },
23125
  {
23126
  "tag": "ZIPCODE",
@@ -23265,10 +23331,16 @@
23265
  ],
23266
  "predictions": [
23267
  {
23268
- "tag": "GIVENNAME",
23269
  "start": 48,
 
 
 
 
 
 
23270
  "end": 64,
23271
- "value": "Dusautoir Ofélie"
23272
  },
23273
  {
23274
  "tag": "STREET",
@@ -23754,7 +23826,7 @@
23754
  ],
23755
  "predictions": [
23756
  {
23757
- "tag": "CITY",
23758
  "start": 72,
23759
  "end": 84,
23760
  "value": "Buenaventura"
@@ -24763,8 +24835,14 @@
24763
  {
24764
  "tag": "GIVENNAME",
24765
  "start": 0,
 
 
 
 
 
 
24766
  "end": 14,
24767
- "value": "Zekeria Parham"
24768
  },
24769
  {
24770
  "tag": "SEX",
@@ -24935,7 +25013,7 @@
24935
  "value": "Op de Ries"
24936
  },
24937
  {
24938
- "tag": "ZIPCODE",
24939
  "start": 105,
24940
  "end": 109,
24941
  "value": "4297"
@@ -26273,7 +26351,7 @@
26273
  "value": "86"
26274
  },
26275
  {
26276
- "tag": "SEX",
26277
  "start": 33,
26278
  "end": 41,
26279
  "value": "Männlich"
@@ -26705,7 +26783,7 @@
26705
  ],
26706
  "predictions": [
26707
  {
26708
- "tag": "SEX",
26709
  "start": 0,
26710
  "end": 6,
26711
  "value": "Female"
@@ -27004,14 +27082,14 @@
27004
  {
27005
  "tag": "GIVENNAME",
27006
  "start": 167,
27007
- "end": 172,
27008
- "value": "Banna"
27009
  },
27010
  {
27011
  "tag": "SURNAME",
27012
- "start": 173,
27013
  "end": 194,
27014
- "value": "Ciel Skerswetat Künze"
27015
  }
27016
  ]
27017
  },
@@ -28606,7 +28684,7 @@
28606
  ],
28607
  "predictions": [
28608
  {
28609
- "tag": "CITY",
28610
  "start": 12,
28611
  "end": 20,
28612
  "value": "Richmond"
@@ -29129,8 +29207,14 @@
29129
  {
29130
  "tag": "GIVENNAME",
29131
  "start": 25,
 
 
 
 
 
 
29132
  "end": 37,
29133
- "value": "Nicolaï Crom"
29134
  }
29135
  ]
29136
  },
@@ -29721,7 +29805,7 @@
29721
  "value": "Emka Idea"
29722
  },
29723
  {
29724
- "tag": "GIVENNAME",
29725
  "start": 60,
29726
  "end": 65,
29727
  "value": "Létra"
@@ -30154,7 +30238,7 @@
30154
  "value": "Norgard"
30155
  },
30156
  {
30157
- "tag": "SEX",
30158
  "start": 43,
30159
  "end": 47,
30160
  "value": "Male"
@@ -30826,10 +30910,10 @@
30826
  "value": "Seuzach Oberohringen"
30827
  },
30828
  {
30829
- "tag": "TIME",
30830
  "start": 106,
30831
- "end": 114,
30832
- "value": "9 heures"
30833
  },
30834
  {
30835
  "tag": "DATE",
@@ -31284,7 +31368,7 @@
31284
  "value": "Jerez de la Frontera"
31285
  },
31286
  {
31287
- "tag": "IDCARDNUM",
31288
  "start": 122,
31289
  "end": 131,
31290
  "value": "O8511777K"
@@ -31428,14 +31512,14 @@
31428
  {
31429
  "tag": "GIVENNAME",
31430
  "start": 118,
31431
- "end": 131,
31432
- "value": "Asmi Sivakami"
31433
  },
31434
  {
31435
  "tag": "SURNAME",
31436
- "start": 132,
31437
  "end": 137,
31438
- "value": "Bizot"
31439
  },
31440
  {
31441
  "tag": "DATE",
@@ -32146,8 +32230,14 @@
32146
  {
32147
  "tag": "GIVENNAME",
32148
  "start": 5,
 
 
 
 
 
 
32149
  "end": 16,
32150
- "value": "Acyl Tsigab"
32151
  },
32152
  {
32153
  "tag": "STREET",
@@ -32201,14 +32291,14 @@
32201
  {
32202
  "tag": "GIVENNAME",
32203
  "start": 84,
32204
- "end": 89,
32205
- "value": "Brett"
32206
  },
32207
  {
32208
  "tag": "SURNAME",
32209
- "start": 90,
32210
  "end": 105,
32211
- "value": "Flandri Piffero"
32212
  }
32213
  ]
32214
  },
@@ -32267,7 +32357,7 @@
32267
  "value": "04/15/1964"
32268
  },
32269
  {
32270
- "tag": "PASSPORTNUM",
32271
  "start": 36,
32272
  "end": 45,
32273
  "value": "992211051"
@@ -32427,7 +32517,7 @@
32427
  "value": "Sen"
32428
  },
32429
  {
32430
- "tag": "GIVENNAME",
32431
  "start": 59,
32432
  "end": 65,
32433
  "value": "Pepijn"
@@ -32636,16 +32726,10 @@
32636
  ],
32637
  "predictions": [
32638
  {
32639
- "tag": "TITLE",
32640
  "start": 8,
32641
- "end": 14,
32642
- "value": "Artist"
32643
- },
32644
- {
32645
- "tag": "SURNAME",
32646
- "start": 15,
32647
  "end": 21,
32648
- "value": "Kanaan"
32649
  },
32650
  {
32651
  "tag": "CITY",
@@ -32966,7 +33050,7 @@
32966
  "value": "Moses"
32967
  },
32968
  {
32969
- "tag": "AGE",
32970
  "start": 146,
32971
  "end": 148,
32972
  "value": "71"
@@ -33024,14 +33108,8 @@
33024
  {
33025
  "tag": "GIVENNAME",
33026
  "start": 24,
33027
- "end": 31,
33028
- "value": "Gulnara"
33029
- },
33030
- {
33031
- "tag": "SURNAME",
33032
- "start": 32,
33033
  "end": 37,
33034
- "value": "Shams"
33035
  }
33036
  ]
33037
  },
 
49
  {
50
  "tag": "GIVENNAME",
51
  "start": 101,
 
 
 
 
 
 
52
  "end": 113,
53
+ "value": "Sveya Malado"
54
  }
55
  ]
56
  },
 
373
  "value": "Sirikanya"
374
  },
375
  {
376
+ "tag": "GENDER",
377
  "start": 20,
378
  "end": 28,
379
  "value": "Männlich"
 
760
  }
761
  ],
762
  "predictions": [
 
 
 
 
 
 
763
  {
764
  "tag": "GIVENNAME",
765
  "start": 36,
 
1274
  {
1275
  "tag": "GIVENNAME",
1276
  "start": 35,
1277
+ "end": 42,
1278
+ "value": "Haifeng"
1279
+ },
1280
+ {
1281
+ "tag": "SURNAME",
1282
+ "start": 43,
1283
  "end": 49,
1284
+ "value": "Almena"
1285
  }
1286
  ]
1287
  },
 
2196
  ],
2197
  "predictions": [
2198
  {
2199
+ "tag": "SURNAME",
2200
  "start": 28,
2201
  "end": 45,
2202
  "value": "Lomanto Rupprecht"
 
2461
  "value": "343383163175337"
2462
  },
2463
  {
2464
+ "tag": "IDCARDNUM",
2465
  "start": 73,
2466
  "end": 83,
2467
  "value": "Q3YEN1MPVF"
 
2898
  {
2899
  "tag": "SURNAME",
2900
  "start": 42,
2901
+ "end": 53,
2902
+ "value": "Khatchikian"
2903
  }
2904
  ]
2905
  },
 
2994
  "value": "Mister"
2995
  },
2996
  {
2997
+ "tag": "SURNAME",
2998
  "start": 80,
2999
  "end": 86,
3000
  "value": "Belina"
 
3296
  "value": "Gardet Bodet"
3297
  },
3298
  {
3299
+ "tag": "SOCIALNUM",
3300
  "start": 104,
3301
  "end": 114,
3302
  "value": "6509094045"
 
3544
  "value": "Sedalia"
3545
  },
3546
  {
3547
+ "tag": "GIVENNAME",
3548
  "start": 132,
3549
  "end": 139,
3550
  "value": "Valpuri"
 
3747
  "value": "Flumini"
3748
  },
3749
  {
3750
+ "tag": "CITY",
3751
  "start": 73,
3752
  "end": 85,
3753
  "value": "Oeschinensee"
 
4990
  {
4991
  "tag": "GIVENNAME",
4992
  "start": 0,
4993
+ "end": 5,
4994
+ "value": "Sugey"
4995
+ },
4996
+ {
4997
+ "tag": "SURNAME",
4998
+ "start": 6,
4999
  "end": 14,
5000
+ "value": "Lalicata"
5001
  }
5002
  ]
5003
  },
 
5272
  "start": 0,
5273
  "end": 19,
5274
  "value": "3127052588326222790"
 
 
 
 
 
 
5275
  }
5276
  ]
5277
  },
 
7505
  {
7506
  "tag": "GIVENNAME",
7507
  "start": 0,
7508
+ "end": 7,
7509
+ "value": "Maïlyss"
7510
+ },
7511
+ {
7512
+ "tag": "SURNAME",
7513
+ "start": 8,
7514
  "end": 17,
7515
+ "value": "Omokhuale"
7516
  },
7517
  {
7518
  "tag": "CREDITCARDNUMBER",
 
8705
  {
8706
  "tag": "GIVENNAME",
8707
  "start": 11,
8708
+ "end": 17,
8709
+ "value": "Fazela"
8710
+ },
8711
+ {
8712
+ "tag": "SURNAME",
8713
+ "start": 18,
8714
  "end": 23,
8715
+ "value": "Drori"
8716
  },
8717
  {
8718
  "tag": "EMAIL",
 
9885
  {
9886
  "tag": "GIVENNAME",
9887
  "start": 8,
9888
+ "end": 17,
9889
+ "value": "Ravirajah"
9890
+ },
9891
+ {
9892
+ "tag": "SURNAME",
9893
+ "start": 18,
9894
  "end": 22,
9895
+ "value": "Fung"
9896
  }
9897
  ]
9898
  },
 
10218
  "value": "Thaddeus Ignatius"
10219
  },
10220
  {
10221
+ "tag": "GIVENNAME",
10222
  "start": 36,
10223
+ "end": 41,
10224
+ "value": "Arbey"
10225
+ },
10226
+ {
10227
+ "tag": "SURNAME",
10228
+ "start": 42,
10229
  "end": 50,
10230
+ "value": "Drongdey"
10231
  }
10232
  ]
10233
  },
 
10896
  "value": "Slodowicz"
10897
  },
10898
  {
10899
+ "tag": "DRIVERLICENSENUM",
10900
  "start": 53,
10901
  "end": 63,
10902
  "value": "RNSUEEE42V"
 
12418
  "value": "Boulton Drive"
12419
  },
12420
  {
12421
+ "tag": "BUILDINGNUM",
12422
  "start": 65,
12423
  "end": 70,
12424
  "value": "43860"
 
13704
  "value": "38722832551847"
13705
  },
13706
  {
13707
+ "tag": "GENDER",
13708
  "start": 66,
13709
  "end": 73,
13710
  "value": "Femmina"
 
14186
  "predictions": [
14187
  {
14188
  "tag": "GIVENNAME",
14189
+ "start": 7,
14190
  "end": 30,
14191
+ "value": "Jamina Mihaela-Loredana"
14192
  },
14193
  {
14194
  "tag": "SURNAME",
 
15210
  {
15211
  "tag": "GIVENNAME",
15212
  "start": 79,
15213
+ "end": 83,
15214
+ "value": "Dình"
15215
+ },
15216
+ {
15217
+ "tag": "SURNAME",
15218
+ "start": 84,
15219
  "end": 90,
15220
+ "value": "Qemail"
15221
  }
15222
  ]
15223
  },
 
15506
  "start": 79,
15507
  "end": 84,
15508
  "value": "23823"
15509
+ },
15510
+ {
15511
+ "tag": "CITY",
15512
+ "start": 98,
15513
+ "end": 107,
15514
+ "value": "Cerveteri"
15515
  }
15516
  ]
15517
  },
 
15923
  {
15924
  "tag": "GIVENNAME",
15925
  "start": 7,
15926
+ "end": 23,
15927
+ "value": "Jacques-François"
15928
+ },
15929
+ {
15930
+ "tag": "SURNAME",
15931
+ "start": 24,
15932
  "end": 32,
15933
+ "value": "Yemaneab"
15934
  },
15935
  {
15936
  "tag": "STREET",
 
16133
  {
16134
  "tag": "GIVENNAME",
16135
  "start": 101,
16136
+ "end": 108,
16137
+ "value": "Adorján"
16138
+ },
16139
+ {
16140
+ "tag": "SURNAME",
16141
+ "start": 109,
16142
  "end": 112,
16143
+ "value": "Syl"
16144
  },
16145
  {
16146
  "tag": "DATE",
 
16270
  "end": 33,
16271
  "value": "mars/96"
16272
  },
16273
+ {
16274
+ "tag": "SEX",
16275
+ "start": 34,
16276
+ "end": 35,
16277
+ "value": "A"
16278
+ },
16279
  {
16280
  "tag": "CITY",
16281
  "start": 36,
 
17481
  {
17482
  "tag": "GIVENNAME",
17483
  "start": 112,
17484
+ "end": 120,
17485
+ "value": "Manolita"
17486
+ },
17487
+ {
17488
+ "tag": "SURNAME",
17489
+ "start": 121,
17490
  "end": 127,
17491
+ "value": "Cahide"
17492
  }
17493
  ]
17494
  },
 
17531
  {
17532
  "tag": "GIVENNAME",
17533
  "start": 40,
17534
+ "end": 45,
17535
+ "value": "Blend"
17536
+ },
17537
+ {
17538
+ "tag": "GIVENNAME",
17539
+ "start": 48,
17540
  "end": 53,
17541
+ "value": "Macie"
17542
  },
17543
  {
17544
  "tag": "SURNAME",
 
18213
  {
18214
  "tag": "GIVENNAME",
18215
  "start": 24,
18216
+ "end": 29,
18217
+ "value": "Anikò"
18218
+ },
18219
+ {
18220
+ "tag": "SURNAME",
18221
+ "start": 30,
18222
  "end": 34,
18223
+ "value": "Fibi"
18224
  }
18225
  ]
18226
  },
 
18805
  },
18806
  {
18807
  "tag": "SURNAME",
18808
+ "start": 73,
18809
  "end": 91,
18810
+ "value": "člověka Bardowicks"
18811
  }
18812
  ]
18813
  },
 
18958
  ],
18959
  "predictions": [
18960
  {
18961
+ "tag": "GIVENNAME",
18962
  "start": 21,
18963
  "end": 25,
18964
  "value": "Butz"
 
20690
  {
20691
  "tag": "GIVENNAME",
20692
  "start": 13,
20693
+ "end": 20,
20694
+ "value": "Joelson"
20695
  },
20696
  {
20697
  "tag": "SURNAME",
20698
+ "start": 21,
20699
  "end": 36,
20700
+ "value": "Nnaemeka Sutera"
20701
  },
20702
  {
20703
  "tag": "EMAIL",
 
21496
  ],
21497
  "predictions": [
21498
  {
21499
+ "tag": "TITLE",
21500
  "start": 38,
21501
  "end": 39,
21502
  "value": "M"
 
22120
  {
22121
  "tag": "GIVENNAME",
22122
  "start": 6,
22123
+ "end": 13,
22124
+ "value": "Lavinia"
22125
+ },
22126
+ {
22127
+ "tag": "SURNAME",
22128
+ "start": 14,
22129
  "end": 21,
22130
+ "value": "Binetou"
22131
  },
22132
  {
22133
  "tag": "GIVENNAME",
 
22203
  "value": "0691 40765773"
22204
  },
22205
  {
22206
+ "tag": "GIVENNAME",
22207
  "start": 218,
22208
  "end": 229,
22209
  "value": "Lalithadevi"
 
22541
  "end": 41,
22542
  "value": "Thuruvan"
22543
  },
 
 
 
 
 
 
22544
  {
22545
  "tag": "TELEPHONENUM",
22546
  "start": 73,
 
22921
  {
22922
  "tag": "GIVENNAME",
22923
  "start": 16,
 
 
 
 
 
 
22924
  "end": 27,
22925
+ "value": "Maya Burton"
22926
  },
22927
  {
22928
  "tag": "BUILDINGNUM",
 
23179
  {
23180
  "tag": "GIVENNAME",
23181
  "start": 31,
23182
+ "end": 38,
23183
+ "value": "Helmuth"
23184
+ },
23185
+ {
23186
+ "tag": "SURNAME",
23187
+ "start": 39,
23188
  "end": 45,
23189
+ "value": "Tonton"
23190
  },
23191
  {
23192
  "tag": "ZIPCODE",
 
23331
  ],
23332
  "predictions": [
23333
  {
23334
+ "tag": "SURNAME",
23335
  "start": 48,
23336
+ "end": 57,
23337
+ "value": "Dusautoir"
23338
+ },
23339
+ {
23340
+ "tag": "GIVENNAME",
23341
+ "start": 58,
23342
  "end": 64,
23343
+ "value": "Ofélie"
23344
  },
23345
  {
23346
  "tag": "STREET",
 
23826
  ],
23827
  "predictions": [
23828
  {
23829
+ "tag": "GIVENNAME",
23830
  "start": 72,
23831
  "end": 84,
23832
  "value": "Buenaventura"
 
24835
  {
24836
  "tag": "GIVENNAME",
24837
  "start": 0,
24838
+ "end": 7,
24839
+ "value": "Zekeria"
24840
+ },
24841
+ {
24842
+ "tag": "SURNAME",
24843
+ "start": 8,
24844
  "end": 14,
24845
+ "value": "Parham"
24846
  },
24847
  {
24848
  "tag": "SEX",
 
25013
  "value": "Op de Ries"
25014
  },
25015
  {
25016
+ "tag": "BUILDINGNUM",
25017
  "start": 105,
25018
  "end": 109,
25019
  "value": "4297"
 
26351
  "value": "86"
26352
  },
26353
  {
26354
+ "tag": "GENDER",
26355
  "start": 33,
26356
  "end": 41,
26357
  "value": "Männlich"
 
26783
  ],
26784
  "predictions": [
26785
  {
26786
+ "tag": "GENDER",
26787
  "start": 0,
26788
  "end": 6,
26789
  "value": "Female"
 
27082
  {
27083
  "tag": "GIVENNAME",
27084
  "start": 167,
27085
+ "end": 177,
27086
+ "value": "Banna Ciel"
27087
  },
27088
  {
27089
  "tag": "SURNAME",
27090
+ "start": 178,
27091
  "end": 194,
27092
+ "value": "Skerswetat Künze"
27093
  }
27094
  ]
27095
  },
 
28684
  ],
28685
  "predictions": [
28686
  {
28687
+ "tag": "GIVENNAME",
28688
  "start": 12,
28689
  "end": 20,
28690
  "value": "Richmond"
 
29207
  {
29208
  "tag": "GIVENNAME",
29209
  "start": 25,
29210
+ "end": 32,
29211
+ "value": "Nicolaï"
29212
+ },
29213
+ {
29214
+ "tag": "SURNAME",
29215
+ "start": 33,
29216
  "end": 37,
29217
+ "value": "Crom"
29218
  }
29219
  ]
29220
  },
 
29805
  "value": "Emka Idea"
29806
  },
29807
  {
29808
+ "tag": "CITY",
29809
  "start": 60,
29810
  "end": 65,
29811
  "value": "Létra"
 
30238
  "value": "Norgard"
30239
  },
30240
  {
30241
+ "tag": "GENDER",
30242
  "start": 43,
30243
  "end": 47,
30244
  "value": "Male"
 
30910
  "value": "Seuzach Oberohringen"
30911
  },
30912
  {
30913
+ "tag": "AGE",
30914
  "start": 106,
30915
+ "end": 107,
30916
+ "value": "9"
30917
  },
30918
  {
30919
  "tag": "DATE",
 
31368
  "value": "Jerez de la Frontera"
31369
  },
31370
  {
31371
+ "tag": "TAXNUM",
31372
  "start": 122,
31373
  "end": 131,
31374
  "value": "O8511777K"
 
31512
  {
31513
  "tag": "GIVENNAME",
31514
  "start": 118,
31515
+ "end": 122,
31516
+ "value": "Asmi"
31517
  },
31518
  {
31519
  "tag": "SURNAME",
31520
+ "start": 123,
31521
  "end": 137,
31522
+ "value": "Sivakami Bizot"
31523
  },
31524
  {
31525
  "tag": "DATE",
 
32230
  {
32231
  "tag": "GIVENNAME",
32232
  "start": 5,
32233
+ "end": 9,
32234
+ "value": "Acyl"
32235
+ },
32236
+ {
32237
+ "tag": "SURNAME",
32238
+ "start": 10,
32239
  "end": 16,
32240
+ "value": "Tsigab"
32241
  },
32242
  {
32243
  "tag": "STREET",
 
32291
  {
32292
  "tag": "GIVENNAME",
32293
  "start": 84,
32294
+ "end": 97,
32295
+ "value": "Brett Flandri"
32296
  },
32297
  {
32298
  "tag": "SURNAME",
32299
+ "start": 98,
32300
  "end": 105,
32301
+ "value": "Piffero"
32302
  }
32303
  ]
32304
  },
 
32357
  "value": "04/15/1964"
32358
  },
32359
  {
32360
+ "tag": "IDCARDNUM",
32361
  "start": 36,
32362
  "end": 45,
32363
  "value": "992211051"
 
32517
  "value": "Sen"
32518
  },
32519
  {
32520
+ "tag": "SURNAME",
32521
  "start": 59,
32522
  "end": 65,
32523
  "value": "Pepijn"
 
32726
  ],
32727
  "predictions": [
32728
  {
32729
+ "tag": "GIVENNAME",
32730
  "start": 8,
 
 
 
 
 
 
32731
  "end": 21,
32732
+ "value": "Artist Kanaan"
32733
  },
32734
  {
32735
  "tag": "CITY",
 
33050
  "value": "Moses"
33051
  },
33052
  {
33053
+ "tag": "BUILDINGNUM",
33054
  "start": 146,
33055
  "end": 148,
33056
  "value": "71"
 
33108
  {
33109
  "tag": "GIVENNAME",
33110
  "start": 24,
 
 
 
 
 
 
33111
  "end": 37,
33112
+ "value": "Gulnara Shams"
33113
  }
33114
  ]
33115
  },
open-pii-masking-500k-ai4privacy/evaluations/bert_plus_crf/seed_789_predictions.json CHANGED
@@ -18,9 +18,9 @@
18
  "predictions": [
19
  {
20
  "tag": "GIVENNAME",
21
- "start": 0,
22
  "end": 11,
23
- "value": "Ang Zoubair"
24
  },
25
  {
26
  "tag": "DATE",
@@ -180,8 +180,14 @@
180
  {
181
  "tag": "GIVENNAME",
182
  "start": 45,
 
 
 
 
 
 
183
  "end": 64,
184
- "value": "Zoltán Pannerselvam"
185
  }
186
  ]
187
  },
@@ -1284,7 +1290,7 @@
1284
  "value": "Rukman"
1285
  },
1286
  {
1287
- "tag": "GIVENNAME",
1288
  "start": 94,
1289
  "end": 105,
1290
  "value": "Tharmabalan"
@@ -2117,7 +2123,7 @@
2117
  "value": "Sholeh"
2118
  },
2119
  {
2120
- "tag": "GIVENNAME",
2121
  "start": 13,
2122
  "end": 19,
2123
  "value": "Bulduk"
@@ -2812,7 +2818,14 @@
2812
  "value": "Saeda"
2813
  }
2814
  ],
2815
- "predictions": []
 
 
 
 
 
 
 
2816
  },
2817
  {
2818
  "source_text": "Your generosity is appreciated, and we would like to acknowledge your in-kind donation. Please reply with your Thainá Isolde and Jahibasic to confirm.",
@@ -3042,8 +3055,14 @@
3042
  {
3043
  "tag": "GIVENNAME",
3044
  "start": 71,
 
 
 
 
 
 
3045
  "end": 84,
3046
- "value": "Xiujuan Raisa"
3047
  },
3048
  {
3049
  "tag": "CITY",
@@ -3788,14 +3807,14 @@
3788
  {
3789
  "tag": "GIVENNAME",
3790
  "start": 24,
3791
- "end": 39,
3792
- "value": "Jaswin Dhungana"
3793
  },
3794
  {
3795
  "tag": "SURNAME",
3796
- "start": 40,
3797
  "end": 46,
3798
- "value": "Kannan"
3799
  }
3800
  ]
3801
  },
@@ -3897,7 +3916,7 @@
3897
  "value": "Martika"
3898
  },
3899
  {
3900
- "tag": "SURNAME",
3901
  "start": 12,
3902
  "end": 30,
3903
  "value": "D'emilia Vendramet"
@@ -4001,12 +4020,6 @@
4001
  "start": 0,
4002
  "end": 22,
4003
  "value": "Iuliana-Madalina Lamai"
4004
- },
4005
- {
4006
- "tag": "GIVENNAME",
4007
- "start": 69,
4008
- "end": 75,
4009
- "value": "Garmin"
4010
  }
4011
  ]
4012
  },
@@ -4236,7 +4249,7 @@
4236
  "value": "Jos"
4237
  },
4238
  {
4239
- "tag": "SOCIALNUM",
4240
  "start": 73,
4241
  "end": 82,
4242
  "value": "773242235"
@@ -5708,8 +5721,14 @@
5708
  {
5709
  "tag": "GIVENNAME",
5710
  "start": 3,
 
 
 
 
 
 
5711
  "end": 16,
5712
- "value": "Sario Remedan"
5713
  }
5714
  ]
5715
  },
@@ -5942,14 +5961,14 @@
5942
  {
5943
  "tag": "GIVENNAME",
5944
  "start": 101,
5945
- "end": 107,
5946
- "value": "Dounia"
5947
  },
5948
  {
5949
  "tag": "SURNAME",
5950
- "start": 108,
5951
  "end": 120,
5952
- "value": "De e Gilland"
5953
  },
5954
  {
5955
  "tag": "STREET",
@@ -6099,13 +6118,13 @@
6099
  "value": "Ludvika"
6100
  },
6101
  {
6102
- "tag": "SEX",
6103
  "start": 47,
6104
  "end": 55,
6105
  "value": "Femenino"
6106
  },
6107
  {
6108
- "tag": "GIVENNAME",
6109
  "start": 72,
6110
  "end": 77,
6111
  "value": "Mitre"
@@ -6563,12 +6582,6 @@
6563
  "end": 24,
6564
  "value": "Gobelin"
6565
  },
6566
- {
6567
- "tag": "AGE",
6568
- "start": 60,
6569
- "end": 61,
6570
- "value": "5"
6571
- },
6572
  {
6573
  "tag": "IDCARDNUM",
6574
  "start": 107,
@@ -6994,6 +7007,12 @@
6994
  "start": 0,
6995
  "end": 15,
6996
  "value": "Medardus Jansan"
 
 
 
 
 
 
6997
  }
6998
  ]
6999
  },
@@ -7030,8 +7049,14 @@
7030
  {
7031
  "tag": "GIVENNAME",
7032
  "start": 31,
 
 
 
 
 
 
7033
  "end": 41,
7034
- "value": "Loe Valdas"
7035
  }
7036
  ]
7037
  },
@@ -7761,7 +7786,7 @@
7761
  "value": "58"
7762
  },
7763
  {
7764
- "tag": "SEX",
7765
  "start": 128,
7766
  "end": 133,
7767
  "value": "Autre"
@@ -8847,10 +8872,16 @@
8847
  "value": "44"
8848
  },
8849
  {
8850
- "tag": "SURNAME",
8851
  "start": 64,
 
 
 
 
 
 
8852
  "end": 94,
8853
- "value": "Hoger Bujari Bergmann Pozzerle"
8854
  },
8855
  {
8856
  "tag": "CITY",
@@ -9070,7 +9101,7 @@
9070
  "value": "II9367000"
9071
  },
9072
  {
9073
- "tag": "DRIVERLICENSENUM",
9074
  "start": 129,
9075
  "end": 139,
9076
  "value": "TOYPBKN22Z"
@@ -9177,14 +9208,14 @@
9177
  {
9178
  "tag": "GIVENNAME",
9179
  "start": 73,
9180
- "end": 87,
9181
- "value": "Massouda Nomin"
9182
  },
9183
  {
9184
  "tag": "SURNAME",
9185
- "start": 88,
9186
  "end": 107,
9187
- "value": "De la Mata Oberdorf"
9188
  },
9189
  {
9190
  "tag": "EMAIL",
@@ -9257,14 +9288,14 @@
9257
  {
9258
  "tag": "GIVENNAME",
9259
  "start": 19,
9260
- "end": 26,
9261
- "value": "Leonida"
9262
  },
9263
  {
9264
  "tag": "SURNAME",
9265
- "start": 27,
9266
  "end": 41,
9267
- "value": "Rotem Feldvari"
9268
  },
9269
  {
9270
  "tag": "GIVENNAME",
@@ -9758,8 +9789,8 @@
9758
  {
9759
  "tag": "GIVENNAME",
9760
  "start": 6,
9761
- "end": 14,
9762
- "value": "Xhejlane"
9763
  },
9764
  {
9765
  "tag": "DATE",
@@ -9954,10 +9985,10 @@
9954
  ],
9955
  "predictions": [
9956
  {
9957
- "tag": "GIVENNAME",
9958
- "start": 31,
9959
  "end": 37,
9960
- "value": "Aronne"
9961
  }
9962
  ]
9963
  },
@@ -10490,12 +10521,6 @@
10490
  "start": 66,
10491
  "end": 68,
10492
  "value": "81"
10493
- },
10494
- {
10495
- "tag": "AGE",
10496
- "start": 79,
10497
- "end": 81,
10498
- "value": "25"
10499
  }
10500
  ]
10501
  },
@@ -10923,12 +10948,6 @@
10923
  }
10924
  ],
10925
  "predictions": [
10926
- {
10927
- "tag": "GIVENNAME",
10928
- "start": 9,
10929
- "end": 13,
10930
- "value": "Afin"
10931
- },
10932
  {
10933
  "tag": "PASSPORTNUM",
10934
  "start": 78,
@@ -11080,8 +11099,14 @@
11080
  {
11081
  "tag": "STREET",
11082
  "start": 38,
 
 
 
 
 
 
11083
  "end": 88,
11084
- "value": "Carretera General Cepeda-Guelatao-E.C. Palma Gorda"
11085
  }
11086
  ]
11087
  },
@@ -11111,14 +11136,14 @@
11111
  {
11112
  "tag": "GIVENNAME",
11113
  "start": 27,
11114
- "end": 37,
11115
- "value": "Assadullah"
11116
  },
11117
  {
11118
  "tag": "SURNAME",
11119
- "start": 38,
11120
  "end": 53,
11121
- "value": "Oldani Khorsand"
11122
  },
11123
  {
11124
  "tag": "DATE",
@@ -11935,8 +11960,14 @@
11935
  {
11936
  "tag": "GIVENNAME",
11937
  "start": 19,
 
 
 
 
 
 
11938
  "end": 37,
11939
- "value": "Lülüfer Gunaratnam"
11940
  }
11941
  ]
11942
  },
@@ -12123,8 +12154,8 @@
12123
  {
12124
  "tag": "CITY",
12125
  "start": 0,
12126
- "end": 5,
12127
- "value": "Derby"
12128
  },
12129
  {
12130
  "tag": "GIVENNAME",
@@ -12459,7 +12490,7 @@
12459
  "value": "Ildiko"
12460
  },
12461
  {
12462
- "tag": "SEX",
12463
  "start": 149,
12464
  "end": 155,
12465
  "value": "Female"
@@ -12777,7 +12808,7 @@
12777
  "value": "13"
12778
  },
12779
  {
12780
- "tag": "SEX",
12781
  "start": 17,
12782
  "end": 21,
12783
  "value": "Male"
@@ -13347,8 +13378,14 @@
13347
  {
13348
  "tag": "GIVENNAME",
13349
  "start": 64,
 
 
 
 
 
 
13350
  "end": 79,
13351
- "value": "Bertille Nassar"
13352
  }
13353
  ]
13354
  },
@@ -13752,7 +13789,7 @@
13752
  "value": "Zlatimir Muhidin"
13753
  },
13754
  {
13755
- "tag": "CITY",
13756
  "start": 107,
13757
  "end": 126,
13758
  "value": "Motril - Al Hoceima"
@@ -14359,17 +14396,11 @@
14359
  "end": 18,
14360
  "value": "श्री"
14361
  },
14362
- {
14363
- "tag": "GIVENNAME",
14364
- "start": 19,
14365
- "end": 26,
14366
- "value": "Balutch"
14367
- },
14368
  {
14369
  "tag": "SURNAME",
14370
- "start": 27,
14371
  "end": 33,
14372
- "value": "Misman"
14373
  },
14374
  {
14375
  "tag": "DATE",
@@ -14576,14 +14607,8 @@
14576
  {
14577
  "tag": "GIVENNAME",
14578
  "start": 0,
14579
- "end": 7,
14580
- "value": "Derrick"
14581
- },
14582
- {
14583
- "tag": "SURNAME",
14584
- "start": 8,
14585
  "end": 13,
14586
- "value": "Lunze"
14587
  },
14588
  {
14589
  "tag": "IDCARDNUM",
@@ -14865,7 +14890,7 @@
14865
  "value": "06/08/1951"
14866
  },
14867
  {
14868
- "tag": "SEX",
14869
  "start": 57,
14870
  "end": 65,
14871
  "value": "Weiblich"
@@ -14904,14 +14929,14 @@
14904
  {
14905
  "tag": "GIVENNAME",
14906
  "start": 9,
14907
- "end": 16,
14908
- "value": "Niccola"
14909
  },
14910
  {
14911
  "tag": "SURNAME",
14912
- "start": 17,
14913
  "end": 35,
14914
- "value": "Shazimani Afowerki"
14915
  }
14916
  ]
14917
  },
@@ -14926,17 +14951,11 @@
14926
  }
14927
  ],
14928
  "predictions": [
14929
- {
14930
- "tag": "GIVENNAME",
14931
- "start": 9,
14932
- "end": 24,
14933
- "value": "Serifoska Caddy"
14934
- },
14935
  {
14936
  "tag": "SURNAME",
14937
- "start": 25,
14938
  "end": 29,
14939
- "value": "Röhl"
14940
  }
14941
  ]
14942
  },
@@ -15398,14 +15417,14 @@
15398
  {
15399
  "tag": "GIVENNAME",
15400
  "start": 24,
15401
- "end": 31,
15402
- "value": "Debjani"
15403
  },
15404
  {
15405
  "tag": "SURNAME",
15406
- "start": 32,
15407
  "end": 56,
15408
- "value": "Saulet Sjölin Corigliano"
15409
  },
15410
  {
15411
  "tag": "TELEPHONENUM",
@@ -15636,7 +15655,7 @@
15636
  "value": "Floresha"
15637
  },
15638
  {
15639
- "tag": "PASSPORTNUM",
15640
  "start": 76,
15641
  "end": 85,
15642
  "value": "718087585"
@@ -15998,6 +16017,12 @@
15998
  "end": 36,
15999
  "value": "Mr"
16000
  },
 
 
 
 
 
 
16001
  {
16002
  "tag": "TELEPHONENUM",
16003
  "start": 75,
@@ -16795,6 +16820,12 @@
16795
  "start": 11,
16796
  "end": 17,
16797
  "value": "Tamane"
 
 
 
 
 
 
16798
  }
16799
  ]
16800
  },
@@ -17561,7 +17592,7 @@
17561
  ],
17562
  "predictions": [
17563
  {
17564
- "tag": "CREDITCARDNUMBER",
17565
  "start": 36,
17566
  "end": 49,
17567
  "value": "4326124162560"
@@ -18265,7 +18296,7 @@
18265
  ],
18266
  "predictions": [
18267
  {
18268
- "tag": "IDCARDNUM",
18269
  "start": 26,
18270
  "end": 34,
18271
  "value": "M9120547"
@@ -19194,12 +19225,6 @@
19194
  }
19195
  ],
19196
  "predictions": [
19197
- {
19198
- "tag": "ZIPCODE",
19199
- "start": 26,
19200
- "end": 30,
19201
- "value": "1920"
19202
- },
19203
  {
19204
  "tag": "GIVENNAME",
19205
  "start": 45,
@@ -19763,8 +19788,14 @@
19763
  {
19764
  "tag": "GIVENNAME",
19765
  "start": 12,
 
 
 
 
 
 
19766
  "end": 28,
19767
- "value": "Ferhan Biyevanga"
19768
  },
19769
  {
19770
  "tag": "IDCARDNUM",
@@ -20496,7 +20527,7 @@
20496
  "value": "Op de Ries"
20497
  },
20498
  {
20499
- "tag": "ZIPCODE",
20500
  "start": 105,
20501
  "end": 109,
20502
  "value": "4297"
@@ -21029,7 +21060,7 @@
21029
  "value": "KQ5365007"
21030
  },
21031
  {
21032
- "tag": "DRIVERLICENSENUM",
21033
  "start": 63,
21034
  "end": 73,
21035
  "value": "E7VD1O9GWG"
@@ -21174,8 +21205,14 @@
21174
  {
21175
  "tag": "GIVENNAME",
21176
  "start": 22,
 
 
 
 
 
 
21177
  "end": 42,
21178
- "value": "Dan-Dumitru Cipriano"
21179
  }
21180
  ]
21181
  },
@@ -21328,8 +21365,14 @@
21328
  {
21329
  "tag": "GIVENNAME",
21330
  "start": 23,
 
 
 
 
 
 
21331
  "end": 36,
21332
- "value": "Pui Francklin"
21333
  },
21334
  {
21335
  "tag": "ZIPCODE",
@@ -21744,8 +21787,14 @@
21744
  {
21745
  "tag": "GIVENNAME",
21746
  "start": 33,
 
 
 
 
 
 
21747
  "end": 51,
21748
- "value": "Jan-Andri Chlaabba"
21749
  }
21750
  ]
21751
  },
@@ -22109,8 +22158,14 @@
22109
  {
22110
  "tag": "GIVENNAME",
22111
  "start": 0,
 
 
 
 
 
 
22112
  "end": 13,
22113
- "value": "Jadranko Soma"
22114
  },
22115
  {
22116
  "tag": "CITY",
@@ -22119,7 +22174,7 @@
22119
  "value": "Bad Neuenahr-Ahrweiler"
22120
  },
22121
  {
22122
- "tag": "GIVENNAME",
22123
  "start": 111,
22124
  "end": 117,
22125
  "value": "Kadric"
@@ -22552,8 +22607,14 @@
22552
  {
22553
  "tag": "GIVENNAME",
22554
  "start": 37,
 
 
 
 
 
 
22555
  "end": 56,
22556
- "value": "Vignesh Parasiraman"
22557
  },
22558
  {
22559
  "tag": "STREET",
@@ -23474,12 +23535,6 @@
23474
  }
23475
  ],
23476
  "predictions": [
23477
- {
23478
- "tag": "TITLE",
23479
- "start": 0,
23480
- "end": 8,
23481
- "value": "Monsieur"
23482
- },
23483
  {
23484
  "tag": "SURNAME",
23485
  "start": 9,
@@ -23602,14 +23657,7 @@
23602
  "value": "Theur"
23603
  }
23604
  ],
23605
- "predictions": [
23606
- {
23607
- "tag": "CITY",
23608
- "start": 31,
23609
- "end": 36,
23610
- "value": "Theur"
23611
- }
23612
- ]
23613
  },
23614
  {
23615
  "source_text": "Hallo Hafsia Ernestina, ich bin Cesc Mazuryk und ich interessiere mich für die von Ihnen angebotenen Gartendienstleistungen. Könnten Sie mir bitte weitere Informationen zu Ihren Referenzen und Erfahrungen senden? Vielen Dank für Ihre Zeit.",
@@ -23729,8 +23777,14 @@
23729
  {
23730
  "tag": "GIVENNAME",
23731
  "start": 0,
 
 
 
 
 
 
23732
  "end": 20,
23733
- "value": "Madhukar Baheerathan"
23734
  },
23735
  {
23736
  "tag": "DATE",
@@ -23813,7 +23867,7 @@
23813
  ],
23814
  "predictions": [
23815
  {
23816
- "tag": "GIVENNAME",
23817
  "start": 3,
23818
  "end": 12,
23819
  "value": "Larmagnac"
@@ -23850,7 +23904,7 @@
23850
  "value": "County Road 102"
23851
  },
23852
  {
23853
- "tag": "BUILDINGNUM",
23854
  "start": 80,
23855
  "end": 85,
23856
  "value": "99587"
@@ -24175,8 +24229,14 @@
24175
  {
24176
  "tag": "GIVENNAME",
24177
  "start": 0,
 
 
 
 
 
 
24178
  "end": 14,
24179
- "value": "Pravin Jemhati"
24180
  }
24181
  ]
24182
  },
@@ -24658,10 +24718,16 @@
24658
  "value": "22:50"
24659
  },
24660
  {
24661
- "tag": "STREET",
24662
  "start": 6,
 
 
 
 
 
 
24663
  "end": 27,
24664
- "value": "Huzur Byrasandra Road"
24665
  },
24666
  {
24667
  "tag": "BUILDINGNUM",
@@ -26564,8 +26630,14 @@
26564
  {
26565
  "tag": "GIVENNAME",
26566
  "start": 57,
 
 
 
 
 
 
26567
  "end": 67,
26568
- "value": "Seho Yihao"
26569
  },
26570
  {
26571
  "tag": "AGE",
@@ -26714,14 +26786,7 @@
26714
  {
26715
  "source_text": "Si tiene alguna duda con respecto a Browse our products a el representante anteriormente indicado, no dude en ponerse en contacto con nosotros.",
26716
  "ground_truth": [],
26717
- "predictions": [
26718
- {
26719
- "tag": "CITY",
26720
- "start": 36,
26721
- "end": 42,
26722
- "value": "Browse"
26723
- }
26724
- ]
26725
  },
26726
  {
26727
  "source_text": "Antuono e Kotsev stanno cercando di creare un nuovo acquario. Hanno bisogno di informazioni sulla scelta dei pesci adatti.",
@@ -27191,14 +27256,8 @@
27191
  {
27192
  "tag": "GIVENNAME",
27193
  "start": 33,
27194
- "end": 46,
27195
- "value": "Claude-Michel"
27196
- },
27197
- {
27198
- "tag": "SURNAME",
27199
- "start": 47,
27200
  "end": 50,
27201
- "value": "Rae"
27202
  },
27203
  {
27204
  "tag": "DATE",
@@ -27275,7 +27334,7 @@
27275
  ],
27276
  "predictions": [
27277
  {
27278
- "tag": "SURNAME",
27279
  "start": 31,
27280
  "end": 36,
27281
  "value": "Lotti"
@@ -27447,7 +27506,7 @@
27447
  "value": "Flisch"
27448
  },
27449
  {
27450
- "tag": "IDCARDNUM",
27451
  "start": 80,
27452
  "end": 89,
27453
  "value": "E0975174O"
@@ -27521,7 +27580,7 @@
27521
  ],
27522
  "predictions": [
27523
  {
27524
- "tag": "IDCARDNUM",
27525
  "start": 112,
27526
  "end": 120,
27527
  "value": "B3509304"
@@ -27966,14 +28025,8 @@
27966
  {
27967
  "tag": "PASSPORTNUM",
27968
  "start": 32,
27969
- "end": 33,
27970
- "value": "Q"
27971
- },
27972
- {
27973
- "tag": "IDCARDNUM",
27974
- "start": 33,
27975
  "end": 40,
27976
- "value": "1993920"
27977
  },
27978
  {
27979
  "tag": "DRIVERLICENSENUM",
@@ -28110,10 +28163,16 @@
28110
  "value": "Razel"
28111
  },
28112
  {
28113
- "tag": "SURNAME",
28114
  "start": 16,
 
 
 
 
 
 
28115
  "end": 42,
28116
- "value": "Harraca Bousseta Almodovar"
28117
  },
28118
  {
28119
  "tag": "CITY",
@@ -28251,7 +28310,7 @@
28251
  ],
28252
  "predictions": [
28253
  {
28254
- "tag": "SURNAME",
28255
  "start": 0,
28256
  "end": 22,
28257
  "value": "Vandelle Sathiyathasan"
@@ -28857,14 +28916,14 @@
28857
  {
28858
  "tag": "GIVENNAME",
28859
  "start": 0,
28860
- "end": 5,
28861
- "value": "Krist"
28862
  },
28863
  {
28864
  "tag": "SURNAME",
28865
- "start": 6,
28866
  "end": 21,
28867
- "value": "Murtez Westlund"
28868
  },
28869
  {
28870
  "tag": "CITY",
@@ -29920,8 +29979,14 @@
29920
  {
29921
  "tag": "GIVENNAME",
29922
  "start": 25,
 
 
 
 
 
 
29923
  "end": 43,
29924
- "value": "Domenica Benhalima"
29925
  },
29926
  {
29927
  "tag": "GENDER",
@@ -30332,7 +30397,7 @@
30332
  "value": "Myszkorowski Stoira"
30333
  },
30334
  {
30335
- "tag": "CREDITCARDNUMBER",
30336
  "start": 88,
30337
  "end": 102,
30338
  "value": "84936404851797"
@@ -31048,7 +31113,7 @@
31048
  ],
31049
  "predictions": [
31050
  {
31051
- "tag": "SOCIALNUM",
31052
  "start": 20,
31053
  "end": 30,
31054
  "value": "7886104597"
@@ -31871,8 +31936,14 @@
31871
  {
31872
  "tag": "GIVENNAME",
31873
  "start": 0,
 
 
 
 
 
 
31874
  "end": 15,
31875
- "value": "Abdulai Lazhari"
31876
  },
31877
  {
31878
  "tag": "IDCARDNUM",
@@ -32520,7 +32591,7 @@
32520
  "value": "29"
32521
  },
32522
  {
32523
- "tag": "SEX",
32524
  "start": 26,
32525
  "end": 30,
32526
  "value": "Male"
@@ -32636,12 +32707,6 @@
32636
  }
32637
  ],
32638
  "predictions": [
32639
- {
32640
- "tag": "CITY",
32641
- "start": 12,
32642
- "end": 27,
32643
- "value": "Piedras del Río"
32644
- },
32645
  {
32646
  "tag": "GIVENNAME",
32647
  "start": 30,
@@ -32851,17 +32916,11 @@
32851
  "end": 16,
32852
  "value": "Csa"
32853
  },
32854
- {
32855
- "tag": "GIVENNAME",
32856
- "start": 17,
32857
- "end": 20,
32858
- "value": "Den"
32859
- },
32860
  {
32861
  "tag": "SURNAME",
32862
- "start": 21,
32863
  "end": 29,
32864
- "value": "Breeijen"
32865
  },
32866
  {
32867
  "tag": "TELEPHONENUM",
 
18
  "predictions": [
19
  {
20
  "tag": "GIVENNAME",
21
+ "start": 4,
22
  "end": 11,
23
+ "value": "Zoubair"
24
  },
25
  {
26
  "tag": "DATE",
 
180
  {
181
  "tag": "GIVENNAME",
182
  "start": 45,
183
+ "end": 51,
184
+ "value": "Zoltán"
185
+ },
186
+ {
187
+ "tag": "SURNAME",
188
+ "start": 52,
189
  "end": 64,
190
+ "value": "Pannerselvam"
191
  }
192
  ]
193
  },
 
1290
  "value": "Rukman"
1291
  },
1292
  {
1293
+ "tag": "SURNAME",
1294
  "start": 94,
1295
  "end": 105,
1296
  "value": "Tharmabalan"
 
2123
  "value": "Sholeh"
2124
  },
2125
  {
2126
+ "tag": "SURNAME",
2127
  "start": 13,
2128
  "end": 19,
2129
  "value": "Bulduk"
 
2818
  "value": "Saeda"
2819
  }
2820
  ],
2821
+ "predictions": [
2822
+ {
2823
+ "tag": "GIVENNAME",
2824
+ "start": 10,
2825
+ "end": 15,
2826
+ "value": "Saeda"
2827
+ }
2828
+ ]
2829
  },
2830
  {
2831
  "source_text": "Your generosity is appreciated, and we would like to acknowledge your in-kind donation. Please reply with your Thainá Isolde and Jahibasic to confirm.",
 
3055
  {
3056
  "tag": "GIVENNAME",
3057
  "start": 71,
3058
+ "end": 78,
3059
+ "value": "Xiujuan"
3060
+ },
3061
+ {
3062
+ "tag": "SURNAME",
3063
+ "start": 79,
3064
  "end": 84,
3065
+ "value": "Raisa"
3066
  },
3067
  {
3068
  "tag": "CITY",
 
3807
  {
3808
  "tag": "GIVENNAME",
3809
  "start": 24,
3810
+ "end": 30,
3811
+ "value": "Jaswin"
3812
  },
3813
  {
3814
  "tag": "SURNAME",
3815
+ "start": 31,
3816
  "end": 46,
3817
+ "value": "Dhungana Kannan"
3818
  }
3819
  ]
3820
  },
 
3916
  "value": "Martika"
3917
  },
3918
  {
3919
+ "tag": "GIVENNAME",
3920
  "start": 12,
3921
  "end": 30,
3922
  "value": "D'emilia Vendramet"
 
4020
  "start": 0,
4021
  "end": 22,
4022
  "value": "Iuliana-Madalina Lamai"
 
 
 
 
 
 
4023
  }
4024
  ]
4025
  },
 
4249
  "value": "Jos"
4250
  },
4251
  {
4252
+ "tag": "TAXNUM",
4253
  "start": 73,
4254
  "end": 82,
4255
  "value": "773242235"
 
5721
  {
5722
  "tag": "GIVENNAME",
5723
  "start": 3,
5724
+ "end": 8,
5725
+ "value": "Sario"
5726
+ },
5727
+ {
5728
+ "tag": "SURNAME",
5729
+ "start": 9,
5730
  "end": 16,
5731
+ "value": "Remedan"
5732
  }
5733
  ]
5734
  },
 
5961
  {
5962
  "tag": "GIVENNAME",
5963
  "start": 101,
5964
+ "end": 110,
5965
+ "value": "Dounia De"
5966
  },
5967
  {
5968
  "tag": "SURNAME",
5969
+ "start": 111,
5970
  "end": 120,
5971
+ "value": "e Gilland"
5972
  },
5973
  {
5974
  "tag": "STREET",
 
6118
  "value": "Ludvika"
6119
  },
6120
  {
6121
+ "tag": "GENDER",
6122
  "start": 47,
6123
  "end": 55,
6124
  "value": "Femenino"
6125
  },
6126
  {
6127
+ "tag": "CITY",
6128
  "start": 72,
6129
  "end": 77,
6130
  "value": "Mitre"
 
6582
  "end": 24,
6583
  "value": "Gobelin"
6584
  },
 
 
 
 
 
 
6585
  {
6586
  "tag": "IDCARDNUM",
6587
  "start": 107,
 
7007
  "start": 0,
7008
  "end": 15,
7009
  "value": "Medardus Jansan"
7010
+ },
7011
+ {
7012
+ "tag": "TITLE",
7013
+ "start": 18,
7014
+ "end": 24,
7015
+ "value": "मंत्री"
7016
  }
7017
  ]
7018
  },
 
7049
  {
7050
  "tag": "GIVENNAME",
7051
  "start": 31,
7052
+ "end": 34,
7053
+ "value": "Loe"
7054
+ },
7055
+ {
7056
+ "tag": "SURNAME",
7057
+ "start": 35,
7058
  "end": 41,
7059
+ "value": "Valdas"
7060
  }
7061
  ]
7062
  },
 
7786
  "value": "58"
7787
  },
7788
  {
7789
+ "tag": "GENDER",
7790
  "start": 128,
7791
  "end": 133,
7792
  "value": "Autre"
 
8872
  "value": "44"
8873
  },
8874
  {
8875
+ "tag": "GIVENNAME",
8876
  "start": 64,
8877
+ "end": 69,
8878
+ "value": "Hoger"
8879
+ },
8880
+ {
8881
+ "tag": "SURNAME",
8882
+ "start": 70,
8883
  "end": 94,
8884
+ "value": "Bujari Bergmann Pozzerle"
8885
  },
8886
  {
8887
  "tag": "CITY",
 
9101
  "value": "II9367000"
9102
  },
9103
  {
9104
+ "tag": "IDCARDNUM",
9105
  "start": 129,
9106
  "end": 139,
9107
  "value": "TOYPBKN22Z"
 
9208
  {
9209
  "tag": "GIVENNAME",
9210
  "start": 73,
9211
+ "end": 81,
9212
+ "value": "Massouda"
9213
  },
9214
  {
9215
  "tag": "SURNAME",
9216
+ "start": 82,
9217
  "end": 107,
9218
+ "value": "Nomin De la Mata Oberdorf"
9219
  },
9220
  {
9221
  "tag": "EMAIL",
 
9288
  {
9289
  "tag": "GIVENNAME",
9290
  "start": 19,
9291
+ "end": 32,
9292
+ "value": "Leonida Rotem"
9293
  },
9294
  {
9295
  "tag": "SURNAME",
9296
+ "start": 33,
9297
  "end": 41,
9298
+ "value": "Feldvari"
9299
  },
9300
  {
9301
  "tag": "GIVENNAME",
 
9789
  {
9790
  "tag": "GIVENNAME",
9791
  "start": 6,
9792
+ "end": 21,
9793
+ "value": "Xhejlane Danche"
9794
  },
9795
  {
9796
  "tag": "DATE",
 
9985
  ],
9986
  "predictions": [
9987
  {
9988
+ "tag": "SURNAME",
9989
+ "start": 27,
9990
  "end": 37,
9991
+ "value": "van Aronne"
9992
  }
9993
  ]
9994
  },
 
10521
  "start": 66,
10522
  "end": 68,
10523
  "value": "81"
 
 
 
 
 
 
10524
  }
10525
  ]
10526
  },
 
10948
  }
10949
  ],
10950
  "predictions": [
 
 
 
 
 
 
10951
  {
10952
  "tag": "PASSPORTNUM",
10953
  "start": 78,
 
11099
  {
11100
  "tag": "STREET",
11101
  "start": 38,
11102
+ "end": 76,
11103
+ "value": "Carretera General Cepeda-Guelatao-E.C."
11104
+ },
11105
+ {
11106
+ "tag": "CITY",
11107
+ "start": 77,
11108
  "end": 88,
11109
+ "value": "Palma Gorda"
11110
  }
11111
  ]
11112
  },
 
11136
  {
11137
  "tag": "GIVENNAME",
11138
  "start": 27,
11139
+ "end": 44,
11140
+ "value": "Assadullah Oldani"
11141
  },
11142
  {
11143
  "tag": "SURNAME",
11144
+ "start": 45,
11145
  "end": 53,
11146
+ "value": "Khorsand"
11147
  },
11148
  {
11149
  "tag": "DATE",
 
11960
  {
11961
  "tag": "GIVENNAME",
11962
  "start": 19,
11963
+ "end": 26,
11964
+ "value": "Lülüfer"
11965
+ },
11966
+ {
11967
+ "tag": "SURNAME",
11968
+ "start": 27,
11969
  "end": 37,
11970
+ "value": "Gunaratnam"
11971
  }
11972
  ]
11973
  },
 
12154
  {
12155
  "tag": "CITY",
12156
  "start": 0,
12157
+ "end": 17,
12158
+ "value": "Derby City Centre"
12159
  },
12160
  {
12161
  "tag": "GIVENNAME",
 
12490
  "value": "Ildiko"
12491
  },
12492
  {
12493
+ "tag": "GENDER",
12494
  "start": 149,
12495
  "end": 155,
12496
  "value": "Female"
 
12808
  "value": "13"
12809
  },
12810
  {
12811
+ "tag": "GENDER",
12812
  "start": 17,
12813
  "end": 21,
12814
  "value": "Male"
 
13378
  {
13379
  "tag": "GIVENNAME",
13380
  "start": 64,
13381
+ "end": 72,
13382
+ "value": "Bertille"
13383
+ },
13384
+ {
13385
+ "tag": "SURNAME",
13386
+ "start": 73,
13387
  "end": 79,
13388
+ "value": "Nassar"
13389
  }
13390
  ]
13391
  },
 
13789
  "value": "Zlatimir Muhidin"
13790
  },
13791
  {
13792
+ "tag": "STREET",
13793
  "start": 107,
13794
  "end": 126,
13795
  "value": "Motril - Al Hoceima"
 
14396
  "end": 18,
14397
  "value": "श्री"
14398
  },
 
 
 
 
 
 
14399
  {
14400
  "tag": "SURNAME",
14401
+ "start": 19,
14402
  "end": 33,
14403
+ "value": "Balutch Misman"
14404
  },
14405
  {
14406
  "tag": "DATE",
 
14607
  {
14608
  "tag": "GIVENNAME",
14609
  "start": 0,
 
 
 
 
 
 
14610
  "end": 13,
14611
+ "value": "Derrick Lunze"
14612
  },
14613
  {
14614
  "tag": "IDCARDNUM",
 
14890
  "value": "06/08/1951"
14891
  },
14892
  {
14893
+ "tag": "GENDER",
14894
  "start": 57,
14895
  "end": 65,
14896
  "value": "Weiblich"
 
14929
  {
14930
  "tag": "GIVENNAME",
14931
  "start": 9,
14932
+ "end": 26,
14933
+ "value": "Niccola Shazimani"
14934
  },
14935
  {
14936
  "tag": "SURNAME",
14937
+ "start": 27,
14938
  "end": 35,
14939
+ "value": "Afowerki"
14940
  }
14941
  ]
14942
  },
 
14951
  }
14952
  ],
14953
  "predictions": [
 
 
 
 
 
 
14954
  {
14955
  "tag": "SURNAME",
14956
+ "start": 9,
14957
  "end": 29,
14958
+ "value": "Serifoska Caddy Röhl"
14959
  }
14960
  ]
14961
  },
 
15417
  {
15418
  "tag": "GIVENNAME",
15419
  "start": 24,
15420
+ "end": 38,
15421
+ "value": "Debjani Saulet"
15422
  },
15423
  {
15424
  "tag": "SURNAME",
15425
+ "start": 39,
15426
  "end": 56,
15427
+ "value": "Sjölin Corigliano"
15428
  },
15429
  {
15430
  "tag": "TELEPHONENUM",
 
15655
  "value": "Floresha"
15656
  },
15657
  {
15658
+ "tag": "SOCIALNUM",
15659
  "start": 76,
15660
  "end": 85,
15661
  "value": "718087585"
 
16017
  "end": 36,
16018
  "value": "Mr"
16019
  },
16020
+ {
16021
+ "tag": "CITY",
16022
+ "start": 59,
16023
+ "end": 66,
16024
+ "value": "Stookey"
16025
+ },
16026
  {
16027
  "tag": "TELEPHONENUM",
16028
  "start": 75,
 
16820
  "start": 11,
16821
  "end": 17,
16822
  "value": "Tamane"
16823
+ },
16824
+ {
16825
+ "tag": "GIVENNAME",
16826
+ "start": 22,
16827
+ "end": 28,
16828
+ "value": "Reddit"
16829
  }
16830
  ]
16831
  },
 
17592
  ],
17593
  "predictions": [
17594
  {
17595
+ "tag": "SOCIALNUM",
17596
  "start": 36,
17597
  "end": 49,
17598
  "value": "4326124162560"
 
18296
  ],
18297
  "predictions": [
18298
  {
18299
+ "tag": "PASSPORTNUM",
18300
  "start": 26,
18301
  "end": 34,
18302
  "value": "M9120547"
 
19225
  }
19226
  ],
19227
  "predictions": [
 
 
 
 
 
 
19228
  {
19229
  "tag": "GIVENNAME",
19230
  "start": 45,
 
19788
  {
19789
  "tag": "GIVENNAME",
19790
  "start": 12,
19791
+ "end": 18,
19792
+ "value": "Ferhan"
19793
+ },
19794
+ {
19795
+ "tag": "SURNAME",
19796
+ "start": 19,
19797
  "end": 28,
19798
+ "value": "Biyevanga"
19799
  },
19800
  {
19801
  "tag": "IDCARDNUM",
 
20527
  "value": "Op de Ries"
20528
  },
20529
  {
20530
+ "tag": "BUILDINGNUM",
20531
  "start": 105,
20532
  "end": 109,
20533
  "value": "4297"
 
21060
  "value": "KQ5365007"
21061
  },
21062
  {
21063
+ "tag": "IDCARDNUM",
21064
  "start": 63,
21065
  "end": 73,
21066
  "value": "E7VD1O9GWG"
 
21205
  {
21206
  "tag": "GIVENNAME",
21207
  "start": 22,
21208
+ "end": 33,
21209
+ "value": "Dan-Dumitru"
21210
+ },
21211
+ {
21212
+ "tag": "SURNAME",
21213
+ "start": 34,
21214
  "end": 42,
21215
+ "value": "Cipriano"
21216
  }
21217
  ]
21218
  },
 
21365
  {
21366
  "tag": "GIVENNAME",
21367
  "start": 23,
21368
+ "end": 26,
21369
+ "value": "Pui"
21370
+ },
21371
+ {
21372
+ "tag": "SURNAME",
21373
+ "start": 27,
21374
  "end": 36,
21375
+ "value": "Francklin"
21376
  },
21377
  {
21378
  "tag": "ZIPCODE",
 
21787
  {
21788
  "tag": "GIVENNAME",
21789
  "start": 33,
21790
+ "end": 42,
21791
+ "value": "Jan-Andri"
21792
+ },
21793
+ {
21794
+ "tag": "SURNAME",
21795
+ "start": 43,
21796
  "end": 51,
21797
+ "value": "Chlaabba"
21798
  }
21799
  ]
21800
  },
 
22158
  {
22159
  "tag": "GIVENNAME",
22160
  "start": 0,
22161
+ "end": 8,
22162
+ "value": "Jadranko"
22163
+ },
22164
+ {
22165
+ "tag": "SURNAME",
22166
+ "start": 9,
22167
  "end": 13,
22168
+ "value": "Soma"
22169
  },
22170
  {
22171
  "tag": "CITY",
 
22174
  "value": "Bad Neuenahr-Ahrweiler"
22175
  },
22176
  {
22177
+ "tag": "SURNAME",
22178
  "start": 111,
22179
  "end": 117,
22180
  "value": "Kadric"
 
22607
  {
22608
  "tag": "GIVENNAME",
22609
  "start": 37,
22610
+ "end": 44,
22611
+ "value": "Vignesh"
22612
+ },
22613
+ {
22614
+ "tag": "SURNAME",
22615
+ "start": 45,
22616
  "end": 56,
22617
+ "value": "Parasiraman"
22618
  },
22619
  {
22620
  "tag": "STREET",
 
23535
  }
23536
  ],
23537
  "predictions": [
 
 
 
 
 
 
23538
  {
23539
  "tag": "SURNAME",
23540
  "start": 9,
 
23657
  "value": "Theur"
23658
  }
23659
  ],
23660
+ "predictions": []
 
 
 
 
 
 
 
23661
  },
23662
  {
23663
  "source_text": "Hallo Hafsia Ernestina, ich bin Cesc Mazuryk und ich interessiere mich für die von Ihnen angebotenen Gartendienstleistungen. Könnten Sie mir bitte weitere Informationen zu Ihren Referenzen und Erfahrungen senden? Vielen Dank für Ihre Zeit.",
 
23777
  {
23778
  "tag": "GIVENNAME",
23779
  "start": 0,
23780
+ "end": 8,
23781
+ "value": "Madhukar"
23782
+ },
23783
+ {
23784
+ "tag": "SURNAME",
23785
+ "start": 9,
23786
  "end": 20,
23787
+ "value": "Baheerathan"
23788
  },
23789
  {
23790
  "tag": "DATE",
 
23867
  ],
23868
  "predictions": [
23869
  {
23870
+ "tag": "SURNAME",
23871
  "start": 3,
23872
  "end": 12,
23873
  "value": "Larmagnac"
 
23904
  "value": "County Road 102"
23905
  },
23906
  {
23907
+ "tag": "ZIPCODE",
23908
  "start": 80,
23909
  "end": 85,
23910
  "value": "99587"
 
24229
  {
24230
  "tag": "GIVENNAME",
24231
  "start": 0,
24232
+ "end": 6,
24233
+ "value": "Pravin"
24234
+ },
24235
+ {
24236
+ "tag": "SURNAME",
24237
+ "start": 7,
24238
  "end": 14,
24239
+ "value": "Jemhati"
24240
  }
24241
  ]
24242
  },
 
24718
  "value": "22:50"
24719
  },
24720
  {
24721
+ "tag": "CITY",
24722
  "start": 6,
24723
+ "end": 11,
24724
+ "value": "Huzur"
24725
+ },
24726
+ {
24727
+ "tag": "STREET",
24728
+ "start": 12,
24729
  "end": 27,
24730
+ "value": "Byrasandra Road"
24731
  },
24732
  {
24733
  "tag": "BUILDINGNUM",
 
26630
  {
26631
  "tag": "GIVENNAME",
26632
  "start": 57,
26633
+ "end": 61,
26634
+ "value": "Seho"
26635
+ },
26636
+ {
26637
+ "tag": "SURNAME",
26638
+ "start": 62,
26639
  "end": 67,
26640
+ "value": "Yihao"
26641
  },
26642
  {
26643
  "tag": "AGE",
 
26786
  {
26787
  "source_text": "Si tiene alguna duda con respecto a Browse our products a el representante anteriormente indicado, no dude en ponerse en contacto con nosotros.",
26788
  "ground_truth": [],
26789
+ "predictions": []
 
 
 
 
 
 
 
26790
  },
26791
  {
26792
  "source_text": "Antuono e Kotsev stanno cercando di creare un nuovo acquario. Hanno bisogno di informazioni sulla scelta dei pesci adatti.",
 
27256
  {
27257
  "tag": "GIVENNAME",
27258
  "start": 33,
 
 
 
 
 
 
27259
  "end": 50,
27260
+ "value": "Claude-Michel Rae"
27261
  },
27262
  {
27263
  "tag": "DATE",
 
27334
  ],
27335
  "predictions": [
27336
  {
27337
+ "tag": "GIVENNAME",
27338
  "start": 31,
27339
  "end": 36,
27340
  "value": "Lotti"
 
27506
  "value": "Flisch"
27507
  },
27508
  {
27509
+ "tag": "TAXNUM",
27510
  "start": 80,
27511
  "end": 89,
27512
  "value": "E0975174O"
 
27580
  ],
27581
  "predictions": [
27582
  {
27583
+ "tag": "PASSPORTNUM",
27584
  "start": 112,
27585
  "end": 120,
27586
  "value": "B3509304"
 
28025
  {
28026
  "tag": "PASSPORTNUM",
28027
  "start": 32,
 
 
 
 
 
 
28028
  "end": 40,
28029
+ "value": "Q1993920"
28030
  },
28031
  {
28032
  "tag": "DRIVERLICENSENUM",
 
28163
  "value": "Razel"
28164
  },
28165
  {
28166
+ "tag": "GIVENNAME",
28167
  "start": 16,
28168
+ "end": 23,
28169
+ "value": "Harraca"
28170
+ },
28171
+ {
28172
+ "tag": "SURNAME",
28173
+ "start": 24,
28174
  "end": 42,
28175
+ "value": "Bousseta Almodovar"
28176
  },
28177
  {
28178
  "tag": "CITY",
 
28310
  ],
28311
  "predictions": [
28312
  {
28313
+ "tag": "GIVENNAME",
28314
  "start": 0,
28315
  "end": 22,
28316
  "value": "Vandelle Sathiyathasan"
 
28916
  {
28917
  "tag": "GIVENNAME",
28918
  "start": 0,
28919
+ "end": 12,
28920
+ "value": "Krist Murtez"
28921
  },
28922
  {
28923
  "tag": "SURNAME",
28924
+ "start": 13,
28925
  "end": 21,
28926
+ "value": "Westlund"
28927
  },
28928
  {
28929
  "tag": "CITY",
 
29979
  {
29980
  "tag": "GIVENNAME",
29981
  "start": 25,
29982
+ "end": 33,
29983
+ "value": "Domenica"
29984
+ },
29985
+ {
29986
+ "tag": "SURNAME",
29987
+ "start": 34,
29988
  "end": 43,
29989
+ "value": "Benhalima"
29990
  },
29991
  {
29992
  "tag": "GENDER",
 
30397
  "value": "Myszkorowski Stoira"
30398
  },
30399
  {
30400
+ "tag": "IDCARDNUM",
30401
  "start": 88,
30402
  "end": 102,
30403
  "value": "84936404851797"
 
31113
  ],
31114
  "predictions": [
31115
  {
31116
+ "tag": "TAXNUM",
31117
  "start": 20,
31118
  "end": 30,
31119
  "value": "7886104597"
 
31936
  {
31937
  "tag": "GIVENNAME",
31938
  "start": 0,
31939
+ "end": 7,
31940
+ "value": "Abdulai"
31941
+ },
31942
+ {
31943
+ "tag": "SURNAME",
31944
+ "start": 8,
31945
  "end": 15,
31946
+ "value": "Lazhari"
31947
  },
31948
  {
31949
  "tag": "IDCARDNUM",
 
32591
  "value": "29"
32592
  },
32593
  {
32594
+ "tag": "GENDER",
32595
  "start": 26,
32596
  "end": 30,
32597
  "value": "Male"
 
32707
  }
32708
  ],
32709
  "predictions": [
 
 
 
 
 
 
32710
  {
32711
  "tag": "GIVENNAME",
32712
  "start": 30,
 
32916
  "end": 16,
32917
  "value": "Csa"
32918
  },
 
 
 
 
 
 
32919
  {
32920
  "tag": "SURNAME",
32921
+ "start": 17,
32922
  "end": 29,
32923
+ "value": "Den Breeijen"
32924
  },
32925
  {
32926
  "tag": "TELEPHONENUM",
open-pii-masking-500k-ai4privacy/evaluations/bert_plus_crf/seed_999_predictions.json CHANGED
@@ -513,6 +513,12 @@
513
  "end": 117,
514
  "value": "Senator"
515
  },
 
 
 
 
 
 
516
  {
517
  "tag": "TITLE",
518
  "start": 126,
@@ -588,7 +594,7 @@
588
  "value": "La Casa"
589
  },
590
  {
591
- "tag": "GENDER",
592
  "start": 38,
593
  "end": 42,
594
  "value": "Male"
@@ -751,14 +757,8 @@
751
  {
752
  "tag": "ZIPCODE",
753
  "start": 167,
754
- "end": 170,
755
- "value": "650"
756
- },
757
- {
758
- "tag": "PASSPORTNUM",
759
- "start": 170,
760
  "end": 175,
761
- "value": "01900"
762
  }
763
  ]
764
  },
@@ -1264,6 +1264,12 @@
1264
  "end": 83,
1265
  "value": "Adalie Irana"
1266
  },
 
 
 
 
 
 
1267
  {
1268
  "tag": "STREET",
1269
  "start": 91,
@@ -1861,8 +1867,14 @@
1861
  {
1862
  "tag": "GIVENNAME",
1863
  "start": 0,
 
 
 
 
 
 
1864
  "end": 14,
1865
- "value": "Klit Shemsidin"
1866
  },
1867
  {
1868
  "tag": "GIVENNAME",
@@ -3254,14 +3266,8 @@
3254
  {
3255
  "tag": "GIVENNAME",
3256
  "start": 0,
3257
- "end": 10,
3258
- "value": "Kristoffer"
3259
- },
3260
- {
3261
- "tag": "SURNAME",
3262
- "start": 11,
3263
  "end": 18,
3264
- "value": "Verlind"
3265
  },
3266
  {
3267
  "tag": "EMAIL",
@@ -3377,14 +3383,8 @@
3377
  {
3378
  "tag": "GIVENNAME",
3379
  "start": 59,
3380
- "end": 64,
3381
- "value": "Mieke"
3382
- },
3383
- {
3384
- "tag": "SURNAME",
3385
- "start": 65,
3386
  "end": 71,
3387
- "value": "Ruirui"
3388
  },
3389
  {
3390
  "tag": "DATE",
@@ -4845,14 +4845,8 @@
4845
  {
4846
  "tag": "GIVENNAME",
4847
  "start": 153,
4848
- "end": 158,
4849
- "value": "Xhevë"
4850
- },
4851
- {
4852
- "tag": "SURNAME",
4853
- "start": 159,
4854
  "end": 162,
4855
- "value": "Haz"
4856
  }
4857
  ]
4858
  },
@@ -5415,14 +5409,14 @@
5415
  {
5416
  "tag": "STREET",
5417
  "start": 111,
5418
- "end": 133,
5419
- "value": "Via Rodella di Edisona"
5420
  },
5421
  {
5422
  "tag": "CITY",
5423
- "start": 134,
5424
  "end": 139,
5425
- "value": "Negre"
5426
  }
5427
  ]
5428
  },
@@ -6489,14 +6483,8 @@
6489
  {
6490
  "tag": "GIVENNAME",
6491
  "start": 108,
6492
- "end": 114,
6493
- "value": "Jagjit"
6494
- },
6495
- {
6496
- "tag": "SURNAME",
6497
- "start": 115,
6498
  "end": 121,
6499
- "value": "Lukacs"
6500
  }
6501
  ]
6502
  },
@@ -6874,13 +6862,13 @@
6874
  "value": "Steffisburg"
6875
  },
6876
  {
6877
- "tag": "ZIPCODE",
6878
  "start": 53,
6879
  "end": 57,
6880
  "value": "3535"
6881
  },
6882
  {
6883
- "tag": "IDCARDNUM",
6884
  "start": 59,
6885
  "end": 67,
6886
  "value": "T5603982"
@@ -7415,7 +7403,7 @@
7415
  "value": "Herr"
7416
  },
7417
  {
7418
- "tag": "SURNAME",
7419
  "start": 19,
7420
  "end": 27,
7421
  "value": "Valentyn"
@@ -8243,6 +8231,12 @@
8243
  }
8244
  ],
8245
  "predictions": [
 
 
 
 
 
 
8246
  {
8247
  "tag": "DATE",
8248
  "start": 87,
@@ -8447,7 +8441,7 @@
8447
  "value": "Hata Rupbas Pachgahir"
8448
  },
8449
  {
8450
- "tag": "SEX",
8451
  "start": 78,
8452
  "end": 84,
8453
  "value": "Female"
@@ -9621,8 +9615,14 @@
9621
  {
9622
  "tag": "GIVENNAME",
9623
  "start": 33,
 
 
 
 
 
 
9624
  "end": 49,
9625
- "value": "Guggia Emilyanis"
9626
  },
9627
  {
9628
  "tag": "GIVENNAME",
@@ -10119,17 +10119,11 @@
10119
  }
10120
  ],
10121
  "predictions": [
10122
- {
10123
- "tag": "GIVENNAME",
10124
- "start": 102,
10125
- "end": 107,
10126
- "value": "Salvà"
10127
- },
10128
  {
10129
  "tag": "SURNAME",
10130
- "start": 108,
10131
  "end": 124,
10132
- "value": "Curioni Fraigedo"
10133
  },
10134
  {
10135
  "tag": "SURNAME",
@@ -10373,7 +10367,7 @@
10373
  "value": "31966.77949"
10374
  },
10375
  {
10376
- "tag": "IDCARDNUM",
10377
  "start": 66,
10378
  "end": 76,
10379
  "value": "XPFHGAIL6Z"
@@ -11165,8 +11159,14 @@
11165
  {
11166
  "tag": "GIVENNAME",
11167
  "start": 8,
 
 
 
 
 
 
11168
  "end": 22,
11169
- "value": "Ravirajah Fung"
11170
  }
11171
  ]
11172
  },
@@ -12084,6 +12084,12 @@
12084
  "start": 8,
12085
  "end": 21,
12086
  "value": "Vijayakumaran"
 
 
 
 
 
 
12087
  }
12088
  ]
12089
  },
@@ -12171,17 +12177,11 @@
12171
  "end": 35,
12172
  "value": "श्री"
12173
  },
12174
- {
12175
- "tag": "GIVENNAME",
12176
- "start": 36,
12177
- "end": 52,
12178
- "value": "Soultanis Lunang"
12179
- },
12180
  {
12181
  "tag": "SURNAME",
12182
- "start": 53,
12183
  "end": 61,
12184
- "value": "Yurtaeva"
12185
  },
12186
  {
12187
  "tag": "CITY",
@@ -12225,6 +12225,12 @@
12225
  "end": 18,
12226
  "value": "Soaad Eldina"
12227
  },
 
 
 
 
 
 
12228
  {
12229
  "tag": "SURNAME",
12230
  "start": 67,
@@ -13215,7 +13221,7 @@
13215
  "value": "Ass"
13216
  },
13217
  {
13218
- "tag": "GIVENNAME",
13219
  "start": 10,
13220
  "end": 17,
13221
  "value": "Frühauf"
@@ -13976,8 +13982,14 @@
13976
  {
13977
  "tag": "GIVENNAME",
13978
  "start": 90,
 
 
 
 
 
 
13979
  "end": 104,
13980
- "value": "Mirita Pramila"
13981
  },
13982
  {
13983
  "tag": "CITY",
@@ -14154,14 +14166,14 @@
14154
  {
14155
  "tag": "GIVENNAME",
14156
  "start": 7,
14157
- "end": 15,
14158
- "value": "Enkeleta"
14159
  },
14160
  {
14161
  "tag": "SURNAME",
14162
- "start": 16,
14163
  "end": 39,
14164
- "value": "Khatere Lacle-Djidjogbe"
14165
  },
14166
  {
14167
  "tag": "TELEPHONENUM",
@@ -15082,8 +15094,14 @@
15082
  {
15083
  "tag": "GIVENNAME",
15084
  "start": 0,
 
 
 
 
 
 
15085
  "end": 11,
15086
- "value": "Lendon Lend"
15087
  },
15088
  {
15089
  "tag": "CITY",
@@ -16067,14 +16085,8 @@
16067
  {
16068
  "tag": "GIVENNAME",
16069
  "start": 0,
16070
- "end": 5,
16071
- "value": "Adora"
16072
- },
16073
- {
16074
- "tag": "SURNAME",
16075
- "start": 6,
16076
  "end": 12,
16077
- "value": "Sobiga"
16078
  },
16079
  {
16080
  "tag": "TITLE",
@@ -17696,7 +17708,7 @@
17696
  "ground_truth": [],
17697
  "predictions": [
17698
  {
17699
- "tag": "BUILDINGNUM",
17700
  "start": 20,
17701
  "end": 25,
17702
  "value": "11301"
@@ -18136,14 +18148,8 @@
18136
  {
18137
  "tag": "GIVENNAME",
18138
  "start": 66,
18139
- "end": 72,
18140
- "value": "Antimo"
18141
- },
18142
- {
18143
- "tag": "SURNAME",
18144
- "start": 73,
18145
  "end": 77,
18146
- "value": "Omaj"
18147
  }
18148
  ]
18149
  },
@@ -18620,7 +18626,7 @@
18620
  "value": "Angiolina"
18621
  },
18622
  {
18623
- "tag": "CITY",
18624
  "start": 63,
18625
  "end": 68,
18626
  "value": "Kewin"
@@ -19132,20 +19138,20 @@
19132
  {
19133
  "tag": "GIVENNAME",
19134
  "start": 21,
19135
- "end": 32,
19136
- "value": "Tariku Goda"
19137
  },
19138
  {
19139
- "tag": "TITLE",
19140
- "start": 73,
19141
- "end": 77,
19142
- "value": "Solt"
19143
  },
19144
  {
19145
  "tag": "GIVENNAME",
19146
- "start": 78,
19147
  "end": 83,
19148
- "value": "Mekan"
19149
  },
19150
  {
19151
  "tag": "SURNAME",
@@ -19583,7 +19589,7 @@
19583
  ],
19584
  "predictions": [
19585
  {
19586
- "tag": "IDCARDNUM",
19587
  "start": 5,
19588
  "end": 15,
19589
  "value": "SDEVCMQAGF"
@@ -19934,7 +19940,7 @@
19934
  ],
19935
  "predictions": [
19936
  {
19937
- "tag": "IDCARDNUM",
19938
  "start": 26,
19939
  "end": 35,
19940
  "value": "J6495505V"
@@ -20128,8 +20134,14 @@
20128
  {
20129
  "tag": "GIVENNAME",
20130
  "start": 11,
 
 
 
 
 
 
20131
  "end": 25,
20132
- "value": "Mehrnaz Sumbul"
20133
  },
20134
  {
20135
  "tag": "CITY",
@@ -21601,7 +21613,7 @@
21601
  "value": "+41.85 888.9193"
21602
  },
21603
  {
21604
- "tag": "IDCARDNUM",
21605
  "start": 34,
21606
  "end": 42,
21607
  "value": "P2058540"
@@ -21812,8 +21824,14 @@
21812
  {
21813
  "tag": "GIVENNAME",
21814
  "start": 81,
 
 
 
 
 
 
21815
  "end": 94,
21816
- "value": "Helias Thorin"
21817
  },
21818
  {
21819
  "tag": "TELEPHONENUM",
@@ -22524,7 +22542,7 @@
22524
  "ground_truth": [],
22525
  "predictions": [
22526
  {
22527
- "tag": "DRIVERLICENSENUM",
22528
  "start": 112,
22529
  "end": 123,
22530
  "value": "SD34N342534"
@@ -22622,7 +22640,7 @@
22622
  "value": "Cataldi"
22623
  },
22624
  {
22625
- "tag": "TAXNUM",
22626
  "start": 39,
22627
  "end": 48,
22628
  "value": "522679613"
@@ -22899,7 +22917,7 @@
22899
  "value": "Sirikanya"
22900
  },
22901
  {
22902
- "tag": "SEX",
22903
  "start": 20,
22904
  "end": 28,
22905
  "value": "Männlich"
@@ -22957,8 +22975,14 @@
22957
  {
22958
  "tag": "GIVENNAME",
22959
  "start": 47,
 
 
 
 
 
 
22960
  "end": 62,
22961
- "value": "Zymryt Anutsara"
22962
  },
22963
  {
22964
  "tag": "AGE",
@@ -23317,7 +23341,7 @@
23317
  "value": "Karjan Sarupur Timbi"
23318
  },
23319
  {
23320
- "tag": "SOCIALNUM",
23321
  "start": 143,
23322
  "end": 155,
23323
  "value": "02-4197-3268"
@@ -23430,14 +23454,14 @@
23430
  {
23431
  "tag": "GIVENNAME",
23432
  "start": 0,
23433
- "end": 19,
23434
- "value": "Wanchai Kanagarajah"
23435
  },
23436
  {
23437
  "tag": "SURNAME",
23438
- "start": 20,
23439
  "end": 27,
23440
- "value": "la Sala"
23441
  }
23442
  ]
23443
  },
@@ -23543,7 +23567,7 @@
23543
  "value": "Patrick-Marc"
23544
  },
23545
  {
23546
- "tag": "CREDITCARDNUMBER",
23547
  "start": 94,
23548
  "end": 106,
23549
  "value": "470481527018"
@@ -24231,14 +24255,8 @@
24231
  {
24232
  "tag": "GIVENNAME",
24233
  "start": 30,
24234
- "end": 34,
24235
- "value": "Duke"
24236
- },
24237
- {
24238
- "tag": "SURNAME",
24239
- "start": 35,
24240
  "end": 40,
24241
- "value": "Macit"
24242
  }
24243
  ]
24244
  },
@@ -24565,12 +24583,6 @@
24565
  "source_text": "Sir, I think we should add some spiked wooden fences to the tents, what's your take on it Mr. President? ",
24566
  "ground_truth": [],
24567
  "predictions": [
24568
- {
24569
- "tag": "TITLE",
24570
- "start": 0,
24571
- "end": 3,
24572
- "value": "Sir"
24573
- },
24574
  {
24575
  "tag": "TITLE",
24576
  "start": 90,
@@ -25514,8 +25526,14 @@
25514
  {
25515
  "tag": "GIVENNAME",
25516
  "start": 6,
 
 
 
 
 
 
25517
  "end": 19,
25518
- "value": "Adjoa Kingori"
25519
  }
25520
  ]
25521
  },
@@ -25617,7 +25635,7 @@
25617
  ],
25618
  "predictions": [
25619
  {
25620
- "tag": "STREET",
25621
  "start": 52,
25622
  "end": 68,
25623
  "value": "Calzada del Coto"
@@ -25982,8 +26000,14 @@
25982
  {
25983
  "tag": "GIVENNAME",
25984
  "start": 51,
 
 
 
 
 
 
25985
  "end": 67,
25986
- "value": "Künsang Amarante"
25987
  }
25988
  ]
25989
  },
@@ -26664,8 +26688,8 @@
26664
  {
26665
  "tag": "GIVENNAME",
26666
  "start": 98,
26667
- "end": 102,
26668
- "value": "Bing"
26669
  }
26670
  ]
26671
  },
@@ -28519,7 +28543,7 @@
28519
  "value": "Evaldas"
28520
  },
28521
  {
28522
- "tag": "IDCARDNUM",
28523
  "start": 90,
28524
  "end": 98,
28525
  "value": "O1326531"
@@ -28964,17 +28988,11 @@
28964
  "end": 34,
28965
  "value": "Mairesse"
28966
  },
28967
- {
28968
- "tag": "GIVENNAME",
28969
- "start": 35,
28970
- "end": 41,
28971
- "value": "Bandak"
28972
- },
28973
  {
28974
  "tag": "SURNAME",
28975
- "start": 42,
28976
  "end": 66,
28977
- "value": "Dingetschweiler In-Albon"
28978
  }
28979
  ]
28980
  },
@@ -29836,14 +29854,8 @@
29836
  {
29837
  "tag": "GIVENNAME",
29838
  "start": 7,
29839
- "end": 15,
29840
- "value": "Abdullah"
29841
- },
29842
- {
29843
- "tag": "SURNAME",
29844
- "start": 16,
29845
  "end": 22,
29846
- "value": "Tiller"
29847
  }
29848
  ]
29849
  },
@@ -31321,7 +31333,7 @@
31321
  "ground_truth": [],
31322
  "predictions": [
31323
  {
31324
- "tag": "GIVENNAME",
31325
  "start": 35,
31326
  "end": 44,
31327
  "value": "Pushelden"
@@ -32260,7 +32272,7 @@
32260
  "value": "Córdoba"
32261
  },
32262
  {
32263
- "tag": "AGE",
32264
  "start": 75,
32265
  "end": 77,
32266
  "value": "59"
@@ -33362,8 +33374,8 @@
33362
  {
33363
  "tag": "GIVENNAME",
33364
  "start": 51,
33365
- "end": 59,
33366
- "value": "Katelyn-"
33367
  },
33368
  {
33369
  "tag": "SURNAME",
@@ -33409,7 +33421,7 @@
33409
  "value": "Iurii"
33410
  },
33411
  {
33412
- "tag": "GIVENNAME",
33413
  "start": 110,
33414
  "end": 119,
33415
  "value": "Barchitta"
@@ -34416,8 +34428,14 @@
34416
  {
34417
  "tag": "GIVENNAME",
34418
  "start": 109,
 
 
 
 
 
 
34419
  "end": 124,
34420
- "value": "Tharmikan Ivica"
34421
  }
34422
  ]
34423
  },
@@ -34495,7 +34513,7 @@
34495
  ],
34496
  "predictions": [
34497
  {
34498
- "tag": "CITY",
34499
  "start": 15,
34500
  "end": 24,
34501
  "value": "Fructuoso"
 
513
  "end": 117,
514
  "value": "Senator"
515
  },
516
+ {
517
+ "tag": "SURNAME",
518
+ "start": 118,
519
+ "end": 124,
520
+ "value": "Yellow"
521
+ },
522
  {
523
  "tag": "TITLE",
524
  "start": 126,
 
594
  "value": "La Casa"
595
  },
596
  {
597
+ "tag": "SEX",
598
  "start": 38,
599
  "end": 42,
600
  "value": "Male"
 
757
  {
758
  "tag": "ZIPCODE",
759
  "start": 167,
 
 
 
 
 
 
760
  "end": 175,
761
+ "value": "65001900"
762
  }
763
  ]
764
  },
 
1264
  "end": 83,
1265
  "value": "Adalie Irana"
1266
  },
1267
+ {
1268
+ "tag": "SURNAME",
1269
+ "start": 85,
1270
+ "end": 89,
1271
+ "value": "Note"
1272
+ },
1273
  {
1274
  "tag": "STREET",
1275
  "start": 91,
 
1867
  {
1868
  "tag": "GIVENNAME",
1869
  "start": 0,
1870
+ "end": 4,
1871
+ "value": "Klit"
1872
+ },
1873
+ {
1874
+ "tag": "SURNAME",
1875
+ "start": 5,
1876
  "end": 14,
1877
+ "value": "Shemsidin"
1878
  },
1879
  {
1880
  "tag": "GIVENNAME",
 
3266
  {
3267
  "tag": "GIVENNAME",
3268
  "start": 0,
 
 
 
 
 
 
3269
  "end": 18,
3270
+ "value": "Kristoffer Verlind"
3271
  },
3272
  {
3273
  "tag": "EMAIL",
 
3383
  {
3384
  "tag": "GIVENNAME",
3385
  "start": 59,
 
 
 
 
 
 
3386
  "end": 71,
3387
+ "value": "Mieke Ruirui"
3388
  },
3389
  {
3390
  "tag": "DATE",
 
4845
  {
4846
  "tag": "GIVENNAME",
4847
  "start": 153,
 
 
 
 
 
 
4848
  "end": 162,
4849
+ "value": "Xhevë Haz"
4850
  }
4851
  ]
4852
  },
 
5409
  {
5410
  "tag": "STREET",
5411
  "start": 111,
5412
+ "end": 122,
5413
+ "value": "Via Rodella"
5414
  },
5415
  {
5416
  "tag": "CITY",
5417
+ "start": 126,
5418
  "end": 139,
5419
+ "value": "Edisona Negre"
5420
  }
5421
  ]
5422
  },
 
6483
  {
6484
  "tag": "GIVENNAME",
6485
  "start": 108,
 
 
 
 
 
 
6486
  "end": 121,
6487
+ "value": "Jagjit Lukacs"
6488
  }
6489
  ]
6490
  },
 
6862
  "value": "Steffisburg"
6863
  },
6864
  {
6865
+ "tag": "BUILDINGNUM",
6866
  "start": 53,
6867
  "end": 57,
6868
  "value": "3535"
6869
  },
6870
  {
6871
+ "tag": "PASSPORTNUM",
6872
  "start": 59,
6873
  "end": 67,
6874
  "value": "T5603982"
 
7403
  "value": "Herr"
7404
  },
7405
  {
7406
+ "tag": "GIVENNAME",
7407
  "start": 19,
7408
  "end": 27,
7409
  "value": "Valentyn"
 
8231
  }
8232
  ],
8233
  "predictions": [
8234
+ {
8235
+ "tag": "GIVENNAME",
8236
+ "start": 48,
8237
+ "end": 53,
8238
+ "value": "Regid"
8239
+ },
8240
  {
8241
  "tag": "DATE",
8242
  "start": 87,
 
8441
  "value": "Hata Rupbas Pachgahir"
8442
  },
8443
  {
8444
+ "tag": "GENDER",
8445
  "start": 78,
8446
  "end": 84,
8447
  "value": "Female"
 
9615
  {
9616
  "tag": "GIVENNAME",
9617
  "start": 33,
9618
+ "end": 39,
9619
+ "value": "Guggia"
9620
+ },
9621
+ {
9622
+ "tag": "SURNAME",
9623
+ "start": 40,
9624
  "end": 49,
9625
+ "value": "Emilyanis"
9626
  },
9627
  {
9628
  "tag": "GIVENNAME",
 
10119
  }
10120
  ],
10121
  "predictions": [
 
 
 
 
 
 
10122
  {
10123
  "tag": "SURNAME",
10124
+ "start": 102,
10125
  "end": 124,
10126
+ "value": "Salvà Curioni Fraigedo"
10127
  },
10128
  {
10129
  "tag": "SURNAME",
 
10367
  "value": "31966.77949"
10368
  },
10369
  {
10370
+ "tag": "DRIVERLICENSENUM",
10371
  "start": 66,
10372
  "end": 76,
10373
  "value": "XPFHGAIL6Z"
 
11159
  {
11160
  "tag": "GIVENNAME",
11161
  "start": 8,
11162
+ "end": 17,
11163
+ "value": "Ravirajah"
11164
+ },
11165
+ {
11166
+ "tag": "SURNAME",
11167
+ "start": 18,
11168
  "end": 22,
11169
+ "value": "Fung"
11170
  }
11171
  ]
11172
  },
 
12084
  "start": 8,
12085
  "end": 21,
12086
  "value": "Vijayakumaran"
12087
+ },
12088
+ {
12089
+ "tag": "GIVENNAME",
12090
+ "start": 93,
12091
+ "end": 98,
12092
+ "value": "Hindu"
12093
  }
12094
  ]
12095
  },
 
12177
  "end": 35,
12178
  "value": "श्री"
12179
  },
 
 
 
 
 
 
12180
  {
12181
  "tag": "SURNAME",
12182
+ "start": 36,
12183
  "end": 61,
12184
+ "value": "Soultanis Lunang Yurtaeva"
12185
  },
12186
  {
12187
  "tag": "CITY",
 
12225
  "end": 18,
12226
  "value": "Soaad Eldina"
12227
  },
12228
+ {
12229
+ "tag": "TITLE",
12230
+ "start": 57,
12231
+ "end": 66,
12232
+ "value": "Ehrenwert"
12233
+ },
12234
  {
12235
  "tag": "SURNAME",
12236
  "start": 67,
 
13221
  "value": "Ass"
13222
  },
13223
  {
13224
+ "tag": "SURNAME",
13225
  "start": 10,
13226
  "end": 17,
13227
  "value": "Frühauf"
 
13982
  {
13983
  "tag": "GIVENNAME",
13984
  "start": 90,
13985
+ "end": 96,
13986
+ "value": "Mirita"
13987
+ },
13988
+ {
13989
+ "tag": "SURNAME",
13990
+ "start": 97,
13991
  "end": 104,
13992
+ "value": "Pramila"
13993
  },
13994
  {
13995
  "tag": "CITY",
 
14166
  {
14167
  "tag": "GIVENNAME",
14168
  "start": 7,
14169
+ "end": 23,
14170
+ "value": "Enkeleta Khatere"
14171
  },
14172
  {
14173
  "tag": "SURNAME",
14174
+ "start": 24,
14175
  "end": 39,
14176
+ "value": "Lacle-Djidjogbe"
14177
  },
14178
  {
14179
  "tag": "TELEPHONENUM",
 
15094
  {
15095
  "tag": "GIVENNAME",
15096
  "start": 0,
15097
+ "end": 6,
15098
+ "value": "Lendon"
15099
+ },
15100
+ {
15101
+ "tag": "SURNAME",
15102
+ "start": 7,
15103
  "end": 11,
15104
+ "value": "Lend"
15105
  },
15106
  {
15107
  "tag": "CITY",
 
16085
  {
16086
  "tag": "GIVENNAME",
16087
  "start": 0,
 
 
 
 
 
 
16088
  "end": 12,
16089
+ "value": "Adora Sobiga"
16090
  },
16091
  {
16092
  "tag": "TITLE",
 
17708
  "ground_truth": [],
17709
  "predictions": [
17710
  {
17711
+ "tag": "ZIPCODE",
17712
  "start": 20,
17713
  "end": 25,
17714
  "value": "11301"
 
18148
  {
18149
  "tag": "GIVENNAME",
18150
  "start": 66,
 
 
 
 
 
 
18151
  "end": 77,
18152
+ "value": "Antimo Omaj"
18153
  }
18154
  ]
18155
  },
 
18626
  "value": "Angiolina"
18627
  },
18628
  {
18629
+ "tag": "GIVENNAME",
18630
  "start": 63,
18631
  "end": 68,
18632
  "value": "Kewin"
 
19138
  {
19139
  "tag": "GIVENNAME",
19140
  "start": 21,
19141
+ "end": 27,
19142
+ "value": "Tariku"
19143
  },
19144
  {
19145
+ "tag": "SURNAME",
19146
+ "start": 28,
19147
+ "end": 32,
19148
+ "value": "Goda"
19149
  },
19150
  {
19151
  "tag": "GIVENNAME",
19152
+ "start": 73,
19153
  "end": 83,
19154
+ "value": "Solt Mekan"
19155
  },
19156
  {
19157
  "tag": "SURNAME",
 
19589
  ],
19590
  "predictions": [
19591
  {
19592
+ "tag": "DRIVERLICENSENUM",
19593
  "start": 5,
19594
  "end": 15,
19595
  "value": "SDEVCMQAGF"
 
19940
  ],
19941
  "predictions": [
19942
  {
19943
+ "tag": "TAXNUM",
19944
  "start": 26,
19945
  "end": 35,
19946
  "value": "J6495505V"
 
20134
  {
20135
  "tag": "GIVENNAME",
20136
  "start": 11,
20137
+ "end": 18,
20138
+ "value": "Mehrnaz"
20139
+ },
20140
+ {
20141
+ "tag": "SURNAME",
20142
+ "start": 19,
20143
  "end": 25,
20144
+ "value": "Sumbul"
20145
  },
20146
  {
20147
  "tag": "CITY",
 
21613
  "value": "+41.85 888.9193"
21614
  },
21615
  {
21616
+ "tag": "PASSPORTNUM",
21617
  "start": 34,
21618
  "end": 42,
21619
  "value": "P2058540"
 
21824
  {
21825
  "tag": "GIVENNAME",
21826
  "start": 81,
21827
+ "end": 87,
21828
+ "value": "Helias"
21829
+ },
21830
+ {
21831
+ "tag": "SURNAME",
21832
+ "start": 88,
21833
  "end": 94,
21834
+ "value": "Thorin"
21835
  },
21836
  {
21837
  "tag": "TELEPHONENUM",
 
22542
  "ground_truth": [],
22543
  "predictions": [
22544
  {
22545
+ "tag": "IDCARDNUM",
22546
  "start": 112,
22547
  "end": 123,
22548
  "value": "SD34N342534"
 
22640
  "value": "Cataldi"
22641
  },
22642
  {
22643
+ "tag": "SOCIALNUM",
22644
  "start": 39,
22645
  "end": 48,
22646
  "value": "522679613"
 
22917
  "value": "Sirikanya"
22918
  },
22919
  {
22920
+ "tag": "GENDER",
22921
  "start": 20,
22922
  "end": 28,
22923
  "value": "Männlich"
 
22975
  {
22976
  "tag": "GIVENNAME",
22977
  "start": 47,
22978
+ "end": 53,
22979
+ "value": "Zymryt"
22980
+ },
22981
+ {
22982
+ "tag": "SURNAME",
22983
+ "start": 54,
22984
  "end": 62,
22985
+ "value": "Anutsara"
22986
  },
22987
  {
22988
  "tag": "AGE",
 
23341
  "value": "Karjan Sarupur Timbi"
23342
  },
23343
  {
23344
+ "tag": "TELEPHONENUM",
23345
  "start": 143,
23346
  "end": 155,
23347
  "value": "02-4197-3268"
 
23454
  {
23455
  "tag": "GIVENNAME",
23456
  "start": 0,
23457
+ "end": 7,
23458
+ "value": "Wanchai"
23459
  },
23460
  {
23461
  "tag": "SURNAME",
23462
+ "start": 8,
23463
  "end": 27,
23464
+ "value": "Kanagarajah la Sala"
23465
  }
23466
  ]
23467
  },
 
23567
  "value": "Patrick-Marc"
23568
  },
23569
  {
23570
+ "tag": "SOCIALNUM",
23571
  "start": 94,
23572
  "end": 106,
23573
  "value": "470481527018"
 
24255
  {
24256
  "tag": "GIVENNAME",
24257
  "start": 30,
 
 
 
 
 
 
24258
  "end": 40,
24259
+ "value": "Duke Macit"
24260
  }
24261
  ]
24262
  },
 
24583
  "source_text": "Sir, I think we should add some spiked wooden fences to the tents, what's your take on it Mr. President? ",
24584
  "ground_truth": [],
24585
  "predictions": [
 
 
 
 
 
 
24586
  {
24587
  "tag": "TITLE",
24588
  "start": 90,
 
25526
  {
25527
  "tag": "GIVENNAME",
25528
  "start": 6,
25529
+ "end": 11,
25530
+ "value": "Adjoa"
25531
+ },
25532
+ {
25533
+ "tag": "SURNAME",
25534
+ "start": 12,
25535
  "end": 19,
25536
+ "value": "Kingori"
25537
  }
25538
  ]
25539
  },
 
25635
  ],
25636
  "predictions": [
25637
  {
25638
+ "tag": "CITY",
25639
  "start": 52,
25640
  "end": 68,
25641
  "value": "Calzada del Coto"
 
26000
  {
26001
  "tag": "GIVENNAME",
26002
  "start": 51,
26003
+ "end": 58,
26004
+ "value": "Künsang"
26005
+ },
26006
+ {
26007
+ "tag": "SURNAME",
26008
+ "start": 59,
26009
  "end": 67,
26010
+ "value": "Amarante"
26011
  }
26012
  ]
26013
  },
 
26688
  {
26689
  "tag": "GIVENNAME",
26690
  "start": 98,
26691
+ "end": 103,
26692
+ "value": "Bingo"
26693
  }
26694
  ]
26695
  },
 
28543
  "value": "Evaldas"
28544
  },
28545
  {
28546
+ "tag": "PASSPORTNUM",
28547
  "start": 90,
28548
  "end": 98,
28549
  "value": "O1326531"
 
28988
  "end": 34,
28989
  "value": "Mairesse"
28990
  },
 
 
 
 
 
 
28991
  {
28992
  "tag": "SURNAME",
28993
+ "start": 35,
28994
  "end": 66,
28995
+ "value": "Bandak Dingetschweiler In-Albon"
28996
  }
28997
  ]
28998
  },
 
29854
  {
29855
  "tag": "GIVENNAME",
29856
  "start": 7,
 
 
 
 
 
 
29857
  "end": 22,
29858
+ "value": "Abdullah Tiller"
29859
  }
29860
  ]
29861
  },
 
31333
  "ground_truth": [],
31334
  "predictions": [
31335
  {
31336
+ "tag": "CITY",
31337
  "start": 35,
31338
  "end": 44,
31339
  "value": "Pushelden"
 
32272
  "value": "Córdoba"
32273
  },
32274
  {
32275
+ "tag": "BUILDINGNUM",
32276
  "start": 75,
32277
  "end": 77,
32278
  "value": "59"
 
33374
  {
33375
  "tag": "GIVENNAME",
33376
  "start": 51,
33377
+ "end": 58,
33378
+ "value": "Katelyn"
33379
  },
33380
  {
33381
  "tag": "SURNAME",
 
33421
  "value": "Iurii"
33422
  },
33423
  {
33424
+ "tag": "SURNAME",
33425
  "start": 110,
33426
  "end": 119,
33427
  "value": "Barchitta"
 
34428
  {
34429
  "tag": "GIVENNAME",
34430
  "start": 109,
34431
+ "end": 118,
34432
+ "value": "Tharmikan"
34433
+ },
34434
+ {
34435
+ "tag": "SURNAME",
34436
+ "start": 119,
34437
  "end": 124,
34438
+ "value": "Ivica"
34439
  }
34440
  ]
34441
  },
 
34513
  ],
34514
  "predictions": [
34515
  {
34516
+ "tag": "GIVENNAME",
34517
  "start": 15,
34518
  "end": 24,
34519
  "value": "Fructuoso"