daelba committed on
Commit
c29d915
·
verified ·
1 Parent(s): f235e99
Files changed (1) hide show
  1. models.json +244 -66
models.json CHANGED
@@ -12,100 +12,278 @@
12
  "desc": "enrich: conversion from m. d. YYYY to ISO",
13
  "items": 10000,
14
  "source": "generated by script",
15
- "loss before": 24.0673828125,
16
- "loss after": 0.0028942381031811237,
17
- "date": "2024-03-12",
18
- "max length": 59
19
  },
20
  {
21
- "name": "wd_bscz_1",
22
  "desc": "enrich: data from WD, birthdate: full, deathdate: full",
23
- "items": 10000,
24
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%3Fnarkde%20rdfs%3Alabel%20%3FnarkdeLabel.%20FILTER(LANG(%3FnarkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%3Fzemkde%20rdfs%3Alabel%20%3FzemkdeLabel.%20FILTER(LANG(%3FzemkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20'%2CSTR(%3FprofLabel)%2C'%2C%20*%20'%2CSTR(DAY(%3Fnarkdy))%2C'.%20'%2CSTR(MONTH(%3Fnarkdy))%2C'.%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%20'%2CSTR(%3FnarkdeLabel)%2C'%2C%20%E2%80%A0%20'%2CSTR(DAY(%3Fzemkdy))%2C'.%20'%2CSTR(MONTH(%3Fzemkdy))%2C'.%20'%2CSTR(YEAR(%3Fzemkdy))%2C'%20'%2CSTR(%3FzemkdeLabel)%2C'.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20%7B%7BWD%7CP106%7C'%2CREPLACE(STR(%3Fprof)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FprofLabel)%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C'%2CREPLACE(STR(%3Fnarkdy)%2C%22T.*%22%2C%22%22)%2C'%7C'%2CSTR(DAY(%3Fnarkdy))%2C'.%20'%2CSTR(MONTH(%3Fnarkdy))%2C'.%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%7D%7D%20%7B%7BWD%7CP19%7C'%2CREPLACE(STR(%3Fnarkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FnarkdeLabel)%2C'%7D%7D%2C%20%E2%80%A0%20%7B%7BWD%7CP570%7C'%2CREPLACE(STR(%3Fzemkdy)%2C%22T.*%22%2C%22%22)%2C'%7C'%2CSTR(DAY(%3Fzemkdy))%2C'.%20'%2CSTR(MONTH(%3Fzemkdy))%2C'.%20'%2CSTR(YEAR(%3Fzemkdy))%2C'%7D%7D%20%7B%7BWD%7CP20%7C'%2CREPLACE(STR(%3Fzemkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FzemkdeL
abel)%2C'%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%2010000",
25
- "loss before": 17.901836395263672,
26
- "loss after": 0.21804147958755493,
27
- "date": "2024-03-12",
28
- "max length": 401
 
 
 
 
 
 
 
 
 
 
29
  },
30
  {
31
- "name": "wd_bscz_2",
32
  "desc": "enrich: data from WD, birthdate: full, deathdate: year",
33
- "items": 10000,
34
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%3Fnarkde%20rdfs%3Alabel%20%3FnarkdeLabel.%20FILTER(LANG(%3FnarkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%3Fzemkde%20rdfs%3Alabel%20%3FzemkdeLabel.%20FILTER(LANG(%3FzemkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20'%2CSTR(%3FprofLabel)%2C'%2C%20*%20'%2CSTR(DAY(%3Fnarkdy))%2C'.%20'%2CSTR(MONTH(%3Fnarkdy))%2C'.%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%20'%2CSTR(%3FnarkdeLabel)%2C'%2C%20%E2%80%A0%20'%2CSTR(YEAR(%3Fzemkdy))%2C'%20'%2CSTR(%3FzemkdeLabel)%2C'.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20%7B%7BWD%7CP106%7C'%2CREPLACE(STR(%3Fprof)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FprofLabel)%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C'%2CREPLACE(STR(%3Fnarkdy)%2C%22T.*%22%2C%22%22)%2C'%7C'%2CSTR(DAY(%3Fnarkdy))%2C'.%20'%2CSTR(MONTH(%3Fnarkdy))%2C'.%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%7D%7D%20%7B%7BWD%7CP19%7C'%2CREPLACE(STR(%3Fnarkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FnarkdeLabel)%2C'%7D%7D%2C%20%E2%80%A0%20%7B%7BWD%7CP570%7C'%2CREPLACE(STR(%3Fzemkdy)%2C%22-.*%22%2C%22%22)%2C'%7D%7D%20%7B%7BWD%7CP20%7C'%2CREPLACE(STR(%3Fzemkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FzemkdeLabel)%2C'%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%2010000%0AOFFSET%2010000",
35
- "loss before": 0.5377106070518494,
36
- "loss after": 0.1428946554660797,
37
- "date": "2024-03-12",
38
- "max length": 358
 
 
 
 
 
 
 
 
 
 
39
  },
40
  {
41
- "name": "wd_bscz_3",
42
  "desc": "enrich: data from WD, birthdate: year, deathdate: full",
43
- "items": 10000,
44
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%3Fnarkde%20rdfs%3Alabel%20%3FnarkdeLabel.%20FILTER(LANG(%3FnarkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%3Fzemkde%20rdfs%3Alabel%20%3FzemkdeLabel.%20FILTER(LANG(%3FzemkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20'%2CSTR(%3FprofLabel)%2C'%2C%20*%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%20'%2CSTR(%3FnarkdeLabel)%2C'%2C%20%E2%80%A0%20'%2CSTR(DAY(%3Fzemkdy))%2C'.%20'%2CSTR(MONTH(%3Fzemkdy))%2C'.%20'%2CSTR(YEAR(%3Fzemkdy))%2C'%20'%2CSTR(%3FzemkdeLabel)%2C'.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20%7B%7BWD%7CP106%7C'%2CREPLACE(STR(%3Fprof)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FprofLabel)%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C'%2CSTR(YEAR(%3Fnarkdy))%2C'%7D%7D%20%7B%7BWD%7CP19%7C'%2CREPLACE(STR(%3Fnarkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FnarkdeLabel)%2C'%7D%7D%2C%20%E2%80%A0%20%7B%7BWD%7CP570%7C'%2CREPLACE(STR(%3Fzemkdy)%2C%22T.*%22%2C%22%22)%2C'%7C'%2CSTR(DAY(%3Fzemkdy))%2C'.%20'%2CSTR(MONTH(%3Fzemkdy))%2C'.%20'%2CSTR(YEAR(%3Fzemkdy))%2C'%7D%7D%20%7B%7BWD%7CP20%7C'%2CREPLACE(STR(%3Fzemkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FzemkdeLabel)%2C'%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%2010000%0AOFFSET%2020000",
45
- "loss before": 0.9282719492912292,
46
- "loss after": 0.12308310717344284,
47
- "date": "2024-03-14",
48
- "max length": 352
 
 
 
 
 
 
 
 
 
 
49
  },
50
  {
51
- "name": "wd_bscz_4",
52
  "desc": "enrich: data from WD, birthdate: year, deathdate: year",
53
- "items": 10000,
54
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%3Fnarkde%20rdfs%3Alabel%20%3FnarkdeLabel.%20FILTER(LANG(%3FnarkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%3Fzemkde%20rdfs%3Alabel%20%3FzemkdeLabel.%20FILTER(LANG(%3FzemkdeLabel)%3D%22de%22)%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20'%2CSTR(%3FprofLabel)%2C'%2C%20*%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%20'%2CSTR(%3FnarkdeLabel)%2C'%2C%20%E2%80%A0%20'%2CSTR(YEAR(%3Fzemkdy))%2C'%20'%2CSTR(%3FzemkdeLabel)%2C'.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20%7B%7BWD%7CP106%7C'%2CREPLACE(STR(%3Fprof)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FprofLabel)%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C'%2CSTR(YEAR(%3Fnarkdy))%2C'%7D%7D%20%7B%7BWD%7CP19%7C'%2CREPLACE(STR(%3Fnarkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FnarkdeLabel)%2C'%7D%7D%2C%20%E2%80%A0%20%7B%7BWD%7CP570%7C'%2CSTR(YEAR(%3Fzemkdy))%2C'%7D%7D%20%7B%7BWD%7CP20%7C'%2CREPLACE(STR(%3Fzemkde)%2C%22.*%2FQ%22%2C%22Q%22)%2C'%7C'%2CSTR(%3FzemkdeLabel)%2C'%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%2010000%0AOFFSET%2030000",
55
- "loss before": 0.6698053479194641,
56
- "loss after": 0.12252699583768845,
57
- "date": "2024-03-14",
58
- "max length": 327
 
 
 
 
 
 
 
 
 
 
59
  },
60
  {
61
- "name": "wd_bscz_5",
62
  "desc": "enrich: data from WD, birthdate: year, deathdate: year, profession: none",
63
- "items": 500,
64
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%7D%0A%20%23%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20*%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%2C%20%E2%80%A0%20'%2CSTR(YEAR(%3Fzemkdy))%2C'.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C'%2CSTR(YEAR(%3Fnarkdy))%2C'%7D%7D%20%E2%80%A0%20%7B%7BWD%7CP570%7C'%2CSTR(YEAR(%3Fzemkdy))%2C'%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%20500%0A%23OFFSET%2040000",
65
- "loss before": 3.490724563598633,
66
- "loss after": 0.0016380766173824668,
67
- "date": "2024-03-14",
68
- "max length": 166
69
  },
70
  {
71
- "name": "wd_bscz_6",
 
 
 
 
 
 
 
 
 
 
72
  "desc": "enrich: data from WD, birthdate: year, deathdate: none, profession: none",
73
- "items": 500,
74
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%7D%0A%20%23%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20*%20'%2CSTR(YEAR(%3Fnarkdy))%2C'%2C%20%E2%80%A0%20%3F.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C'%2CSTR(YEAR(%3Fnarkdy))%2C'%7D%7D%20%E2%80%A0%20%3F%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%20500%0A%23OFFSET%2040000",
75
- "loss before": 3.8766534328460693,
76
- "loss after": 4.379506663099164e-06,
77
- "date": "2024-03-14",
78
- "max length": 156
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
  },
80
  {
81
- "name": "wd_bscz_7",
82
  "desc": "enrich: data from WD, birthdate: none, deathdate: year, profession: none",
83
- "items": 500,
84
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%7D%0A%20%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%7D%0A%20%23%20OPTIONAL%20%7B%20%3Fitem%20wdt%3AP106%20%3Fprof.%20%3Fprof%20rdfs%3Alabel%20%3FprofLabel.%20FILTER(LANG(%3FprofLabel)%3D%22de%22)%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20*%20%3F%2C%20%E2%80%A0%20'%2CSTR(YEAR(%3Fzemkdy))%2C'.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C%3F%7C%3F%7D%7D%20%E2%80%A0%20%7B%7BWD%7CP570%7C'%2CSTR(YEAR(%3Fzemkdy))%2C'%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%20500%0A%23OFFSET%2040000",
85
- "loss before": 4.1504807472229,
86
- "loss after": 1.5070370864123106e-05,
87
- "date": "2024-03-14",
88
- "max length": 168
 
 
 
 
 
 
 
 
 
 
89
  },
90
  {
91
- "name": "wd_bscz_8",
92
  "desc": "enrich: data from WD, birthdate: none, deathdate: none, profession: none",
93
- "items": 291,
94
- "source": "https://query.wikidata.org/#SELECT%20%3Fresult%20WHERE%20%7B%0A%20%20%3Fitem%20wdt%3AP9160%20%3Fid%3B%0A%20%20%20%20%20%20%20%20rdfs%3Alabel%20%3Flabel.%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP569%20%3Fnarkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP19%20%3Fnarkde.%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP570%20%3Fzemkdy%20%7D%0A%20%20MINUS%20%7B%20%3Fitem%20wdt%3AP20%20%3Fzemkde.%20%7D%0A%20%20FILTER(LANG(%3Flabel)%3D%22de%22)%0A%20%20BIND(REPLACE(STR(%3Flabel)%2C%22(%5B%5E%20%5D%2B)%20(%5B%5E%20%5D%2B)%22%2C%22%242%2C%20%241%22)%20AS%20%3FlabelEdit)%0A%20%20BIND(CONCAT('%22wd%3A'%2C%3FlabelEdit%2C'%2C%20*%20%3F%2C%20%E2%80%A0%20%3F.%22%2C%22%7B%7BWD%7Clabel%7C'%2C%3FlabelEdit%2C'%7D%7D%2C%20*%20%7B%7BWD%7CP569%7C%3F%7C%3F%7D%7D%20%E2%80%A0%20%7B%7BWD%7CP570%7C%3F%7C%3F%7D%7D.%22')%20AS%20%3Fresult)%0A%20%20FILTER(%3Fresult!%3D%22%22)%0A%7D%0ALIMIT%20500%0A%23OFFSET%20500",
95
- "loss before": 4.866212844848633,
96
- "loss after": 0.0021445967722684145,
97
- "date": "2024-03-14",
98
- "max length": 150
99
  },
100
  {
101
  "name": "blgbl-I-1",
102
  "desc": "Biographisches Lexikon zu Geschichte der Böhmischen Länder I/1",
103
- "items": 500,
104
  "source": "",
105
- "loss before": 3.910360336303711,
106
- "loss after": 1.032591462135315,
107
- "date": "2024-03-14",
108
- "max length": 931
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
109
  }
110
  ]
111
- }
 
12
  "desc": "enrich: conversion from m. d. YYYY to ISO",
13
  "items": 10000,
14
  "source": "generated by script",
15
+ "date": "2024-07-18",
16
+ "max length": 59,
17
+ "loss before": 24.15882110595703,
18
+ "loss after": 0.022161545231938362
19
  },
20
  {
21
+ "name": "wd_bscz_1_de",
22
  "desc": "enrich: data from WD, birthdate: full, deathdate: full",
23
+ "items": 30000,
24
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='de')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='de')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='de') }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',REPLACE(STR(?narkdy),'T.*',''),'|',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',REPLACE(STR(?zemkdy),'T.*',''),'|',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
25
+ "date": "2024-07-18",
26
+ "max length": 419,
27
+ "loss before": 10.54973030090332,
28
+ "loss after": 0.3109029233455658
29
+ },
30
+ {
31
+ "name": "wd_bscz_1_cs",
32
+ "desc": "enrich: data from WD, birthdate: full, deathdate: full",
33
+ "items": 30000,
34
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='cs') }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',REPLACE(STR(?narkdy),'T.*',''),'|',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',REPLACE(STR(?zemkdy),'T.*',''),'|',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
35
+ "date": "2024-07-18",
36
+ "max length": 395,
37
+ "loss before": 0.48948758840560913,
38
+ "loss after": 0.2783867120742798
39
  },
40
  {
41
+ "name": "wd_bscz_2_de",
42
  "desc": "enrich: data from WD, birthdate: full, deathdate: year",
43
+ "items": 30000,
44
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='de')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='de')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='de') }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',REPLACE(STR(?narkdy),'T.*',''),'|',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',REPLACE(STR(?zemkdy),'-.*',''),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
45
+ "date": "2024-07-18",
46
+ "max length": 397,
47
+ "loss before": 2.422574520111084,
48
+ "loss after": 0.24791918694972992
49
+ },
50
+ {
51
+ "name": "wd_bscz_2_cs",
52
+ "desc": "enrich: data from WD, birthdate: full, deathdate: year",
53
+ "items": 30000,
54
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='cs') }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',REPLACE(STR(?narkdy),'T.*',''),'|',STR(DAY(?narkdy)),'. ',STR(MONTH(?narkdy)),'. ',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',REPLACE(STR(?zemkdy),'-.*',''),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
55
+ "date": "2024-07-18",
56
+ "max length": 397,
57
+ "loss before": 0.24678942561149597,
58
+ "loss after": 0.2253396362066269
59
  },
60
  {
61
+ "name": "wd_bscz_3_de",
62
  "desc": "enrich: data from WD, birthdate: year, deathdate: full",
63
+ "items": 30000,
64
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='de')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='de')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='de') }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',REPLACE(STR(?zemkdy),'T.*',''),'|',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
65
+ "date": "2024-07-18",
66
+ "max length": 397,
67
+ "loss before": 0.94584059715271,
68
+ "loss after": 0.2024272084236145
69
+ },
70
+ {
71
+ "name": "wd_bscz_3_cs",
72
+ "desc": "enrich: data from WD, birthdate: year, deathdate: full",
73
+ "items": 30000,
74
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='cs') }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',REPLACE(STR(?zemkdy),'T.*',''),'|',STR(DAY(?zemkdy)),'. ',STR(MONTH(?zemkdy)),'. ',STR(YEAR(?zemkdy)),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
75
+ "date": "2024-07-18",
76
+ "max length": 375,
77
+ "loss before": 0.28801560401916504,
78
+ "loss after": 0.2155514657497406
79
  },
80
  {
81
+ "name": "wd_bscz_4_de",
82
  "desc": "enrich: data from WD, birthdate: year, deathdate: year",
83
+ "items": 30000,
84
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='de')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='de')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='de') }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',STR(YEAR(?zemkdy)),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
85
+ "date": "2024-07-18",
86
+ "max length": 397,
87
+ "loss before": 0.19279958307743073,
88
+ "loss after": 0.17653045058250427
89
+ },
90
+ {
91
+ "name": "wd_bscz_4_cs",
92
+ "desc": "enrich: data from WD, birthdate: year, deathdate: year",
93
+ "items": 30000,
94
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n OPTIONAL { ?item wdt:P19 ?narkde. ?narkde rdfs:label ?narkdeLabel. FILTER(LANG(?narkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n OPTIONAL { ?item wdt:P20 ?zemkde. ?zemkde rdfs:label ?zemkdeLabel. FILTER(LANG(?zemkdeLabel)='cs')}\n OPTIONAL { ?item wdt:P106 ?prof. ?prof rdfs:label ?profLabel. FILTER(LANG(?profLabel)='cs') }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', ',STR(?profLabel),', * ',STR(YEAR(?narkdy)),' ',STR(?narkdeLabel),', † ',STR(YEAR(?zemkdy)),' ',STR(?zemkdeLabel),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, {{WD|P106|',REPLACE(STR(?prof),'.*/Q','Q'),'|',STR(?profLabel),'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} {{WD|P19|',REPLACE(STR(?narkde),'.*/Q','Q'),'|',STR(?narkdeLabel),'}}, † {{WD|P570|',STR(YEAR(?zemkdy)),'}} {{WD|P20|',REPLACE(STR(?zemkde),'.*/Q','Q'),'|',STR(?zemkdeLabel),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
95
+ "date": "2024-07-18",
96
+ "max length": 375,
97
+ "loss before": 0.2162504494190216,
98
+ "loss after": 0.18714365363121033
99
  },
100
  {
101
+ "name": "wd_bscz_5_de",
102
  "desc": "enrich: data from WD, birthdate: year, deathdate: year, profession: none",
103
+ "items": 30000,
104
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ',STR(YEAR(?narkdy)),', † ',STR(YEAR(?zemkdy)),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} † {{WD|P570|',STR(YEAR(?zemkdy)),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
105
+ "date": "2024-07-18",
106
+ "max length": 254,
107
+ "loss before": 3.0714218616485596,
108
+ "loss after": 0.38618239760398865
109
  },
110
  {
111
+ "name": "wd_bscz_5_cs",
112
+ "desc": "enrich: data from WD, birthdate: year, deathdate: year, profession: none",
113
+ "items": 30000,
114
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ',STR(YEAR(?narkdy)),', † ',STR(YEAR(?zemkdy)),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} † {{WD|P570|',STR(YEAR(?zemkdy)),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
115
+ "date": "2024-07-18",
116
+ "max length": 183,
117
+ "loss before": 0.3803560435771942,
118
+ "loss after": 0.3697205185890198
119
+ },
120
+ {
121
+ "name": "wd_bscz_6_de",
122
  "desc": "enrich: data from WD, birthdate: year, deathdate: none, profession: none",
123
+ "items": 30000,
124
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n MINUS { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ',STR(YEAR(?narkdy)),', † ?.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} † {{WD|P570|?}}.\"') AS ?result)\n FILTER(?result!='')\n}",
125
+ "date": "2024-07-18",
126
+ "max length": 164,
127
+ "loss before": 0.7456120252609253,
128
+ "loss after": 0.44568684697151184
129
+ },
130
+ {
131
+ "name": "wd_bscz_6_cs",
132
+ "desc": "enrich: data from WD, birthdate: year, deathdate: none, profession: none",
133
+ "items": 30000,
134
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n MINUS { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ',STR(YEAR(?narkdy)),', † ?.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|',STR(YEAR(?narkdy)),'}} † {{WD|P570|?}}.\"') AS ?result)\n FILTER(?result!='')\n}",
135
+ "date": "2024-07-18",
136
+ "max length": 154,
137
+ "loss before": 0.4441145956516266,
138
+ "loss after": 0.4394545257091522
139
+ },
140
+ {
141
+ "name": "wd_bscz_7_de",
142
+ "desc": "enrich: data from WD, birthdate: none, deathdate: year, profession: none",
143
+ "items": 30000,
144
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ?, † ',STR(YEAR(?zemkdy)),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|?}} † {{WD|P570|',STR(YEAR(?zemkdy)),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
145
+ "date": "2024-07-18",
146
+ "max length": 248,
147
+ "loss before": 0.375357449054718,
148
+ "loss after": 0.34558600187301636
149
  },
150
  {
151
+ "name": "wd_bscz_7_cs",
152
  "desc": "enrich: data from WD, birthdate: none, deathdate: year, profession: none",
153
+ "items": 30000,
154
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n OPTIONAL { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n OPTIONAL { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ?, † ',STR(YEAR(?zemkdy)),'.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|?}} † {{WD|P570|',STR(YEAR(?zemkdy)),'}}.\"') AS ?result)\n FILTER(?result!='')\n}",
155
+ "date": "2024-07-18",
156
+ "max length": 177,
157
+ "loss before": 0.33053824305534363,
158
+ "loss after": 0.3306645154953003
159
+ },
160
+ {
161
+ "name": "wd_bscz_8_de",
162
+ "desc": "enrich: data from WD, birthdate: none, deathdate: none, profession: none",
163
+ "items": 30000,
164
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n MINUS { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n MINUS { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='de')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ?, † ?.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|?}} † {{WD|P570|?}}.\"') AS ?result)\n FILTER(?result!='')\n}",
165
+ "date": "2024-07-18",
166
+ "max length": 155,
167
+ "loss before": 0.5916451215744019,
168
+ "loss after": 0.49150529503822327
169
  },
170
  {
171
+ "name": "wd_bscz_8_cs",
172
  "desc": "enrich: data from WD, birthdate: none, deathdate: none, profession: none",
173
+ "items": 30000,
174
+ "source": "SELECT ?result WHERE {\n ?item wdt:P9160 ?id;\n rdfs:label ?label.\n MINUS { ?item wdt:P569 ?narkdy }\n MINUS { ?item wdt:P19 ?narkde. }\n MINUS { ?item wdt:P570 ?zemkdy }\n MINUS { ?item wdt:P20 ?zemkde. }\n FILTER(LANG(?label)='cs')\n BIND(REPLACE(STR(?label),'([^ ]+) ([^ ]+)','$2, $1') AS ?labelEdit)\n BIND(CONCAT('\"wd:',?labelEdit,', * ?, † ?.\",\"{{WD|label|',REPLACE(STR(?item),'.*/Q','Q'),'|',?labelEdit,'}}, * {{WD|P569|?}} † {{WD|P570|?}}.\"') AS ?result)\n FILTER(?result!='')\n}",
175
+ "date": "2024-07-18",
176
+ "max length": 153,
177
+ "loss before": 0.47962987422943115,
178
+ "loss after": 0.46871593594551086
179
  },
180
  {
181
  "name": "blgbl-I-1",
182
  "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/1",
 
183
  "source": "",
184
+ "date": "2025-01-09",
185
+ "max length": 3133,
186
+ "records": 549,
187
+ "loss before 2024-11-21": 4.604732036590576,
188
+ "loss after 2024-11-21": 0.6298858523368835,
189
+ "loss before": 4.701245307922363,
190
+ "loss after": 0.5900019407272339
191
+ },
192
+ {
193
+ "name": "blgbl-I-2",
194
+ "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/2",
195
+ "source": "",
196
+ "records": 636,
197
+ "max length": 2703,
198
+ "date": "2025-01-09",
199
+ "loss before 2024-11-21": 0.7166669368743896,
200
+ "loss after 2024-11-21": 0.5336414575576782,
201
+ "loss before": 0.7134875655174255,
202
+ "loss after": 0.5306755900382996
203
+ },
204
+ {
205
+ "name": "blgbl-I-3",
206
+ "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/3",
207
+ "source": "",
208
+ "date": "2025-01-09",
209
+ "max length": 3948,
210
+ "records": 579,
211
+ "loss before 2024-11-21": 0.5424748063087463,
212
+ "loss after 2024-11-21": 0.47353771328926086,
213
+ "loss before": 0.5465303659439087,
214
+ "loss after": 0.4764151871204376
215
+ },
216
+ {
217
+ "name": "blgbl-I-4",
218
+ "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/4",
219
+ "source": "",
220
+ "records": 612,
221
+ "max length": 3601,
222
+ "date": "2025-01-09",
223
+ "loss before 2024-11-21": 0.49382275342941284,
224
+ "loss after 2024-11-21": 0.4336855113506317,
225
+ "loss before": 0.5028115510940552,
226
+ "loss after": 0.4394499957561493
227
+ },
228
+ {
229
+ "name": "blgbl-I-5",
230
+ "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/5",
231
+ "source": "",
232
+ "records": 620,
233
+ "max length": 4216,
234
+ "date": "2025-01-09",
235
+ "loss before 2024-11-21": 0.4291462302207947,
236
+ "loss after 2024-11-21": 0.3830949366092682,
237
+ "loss before": 0.4262952208518982,
238
+ "loss after": 0.38063767552375793
239
+ },
240
+ {
241
+ "name": "blgbl-I-6",
242
+ "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/6",
243
+ "source": "",
244
+ "records": 268,
245
+ "max length": 2965,
246
+ "date": "2025-01-21",
247
+ "loss before 014": 0.47205042839050293,
248
+ "loss after 014": 0.4726303517818451,
249
+ "loss before 032": 0.3916228413581848,
250
+ "loss after 032": 0.3902609050273895,
251
+ "loss before 036": 0.42318350076675415,
252
+ "loss after 036": 0.42163747549057007,
253
+ "loss before 048": 0.37494370341300964,
254
+ "loss after 048": 0.3687383532524109,
255
+ "loss before 096": 0.39310532808303833,
256
+ "loss after 096": 0.40272587537765503,
257
+ "loss before 158": 0.42209357023239136,
258
+ "loss after 158": 0.42246097326278687,
259
+ "loss before 170": 0.4203546345233917,
260
+ "loss after 170": 0.4167018234729767,
261
+ "loss before 268": 0.39955317974090576,
262
+ "loss after 268": 0.3944759964942932
263
+ },
264
+ {
265
+ "name": "blgbl-I-7",
266
+ "desc": "Biographisches Lexikon zur Geschichte der Böhmischen Länder I/7",
267
+ "source": "",
268
+ "records": 231,
269
+ "max length": 2317,
270
+ "date": "2025-01-21",
271
+ "loss before 050": 0.3967258930206299,
272
+ "loss after 050": 0.37953120470046997,
273
+ "loss before 079": 0.4065577983856201,
274
+ "loss after 079": 0.39681532979011536,
275
+ "loss before 116": 0.4132721424102783,
276
+ "loss after 116": 0.4017845094203949,
277
+ "loss before 135": 0.4154694378376007,
278
+ "loss after 135": 0.39745032787323,
279
+ "loss before 193": 0.43908724188804626,
280
+ "loss after 193": 0.41222572326660156,
281
+ "loss before 214": 0.4212968945503235,
282
+ "loss after 214": 0.3941657543182373,
283
+ "loss before 231": 0.42109838128089905,
284
+ "loss after 231": 0.38987934589385986,
285
+ "loss before": 0.41905006766319275,
286
+ "loss after": 0.3887978494167328
287
  }
288
  ]
289
+ }