File size: 2,195 Bytes
c6617b2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
{
  "model_name": "trankit decompressed weights",
  "version": "1.0.0",
  "library_name": "trankit",
  "source": "https://github.com/nlp-uoregon/trankit",
  "license": "apache-2.0",
  "architectures": [
    "xlm-roberta-base",
    "xlm-roberta-large"
  ],
  "tasks": [
    "tokenization",
    "pos-tagging",
    "dependency-parsing",
    "named-entity-recognition",
    "lemmatization"
  ],
  "languages": [
    "afrikaans",
    "ancient-greek",
    "ancient-greek-perseus",
    "arabic",
    "armenian",
    "basque",
    "belarusian",
    "bulgarian",
    "catalan",
    "chinese",
    "classical-chinese",
    "croatian",
    "czech",
    "czech-cac",
    "czech-cltt",
    "czech-fictree",
    "danish",
    "dutch",
    "dutch-lassysmall",
    "english",
    "english-gum",
    "english-lines",
    "english-partut",
    "estonian",
    "estonian-ewt",
    "finnish",
    "finnish-ftb",
    "french",
    "french-partut",
    "french-sequoia",
    "french-spoken",
    "galician",
    "galician-treegal",
    "german",
    "german-hdt",
    "greek",
    "hebrew",
    "hindi",
    "hungarian",
    "indonesian",
    "irish",
    "italian",
    "italian-partut",
    "italian-postwita",
    "italian-twittiro",
    "italian-vit",
    "japanese",
    "kazakh",
    "korean",
    "korean-kaist",
    "kurmanji",
    "latin",
    "latin-perseus",
    "latin-proiel",
    "latvian",
    "lithuanian",
    "lithuanian-hse",
    "marathi",
    "norwegian-bokmaal",
    "norwegian-nynorsk",
    "norwegian-nynorsklia",
    "old-french",
    "old-russian",
    "persian",
    "polish",
    "polish-lfg",
    "portuguese",
    "portuguese-gsd",
    "romanian",
    "romanian-nonstandard",
    "russian",
    "russian-gsd",
    "russian-taiga",
    "scottish-gaelic",
    "serbian",
    "slovak",
    "slovenian",
    "slovenian-sst",
    "spanish",
    "spanish-gsd",
    "swedish",
    "swedish-lines",
    "tamil",
    "telugu",
    "traditional-chinese",
    "turkish",
    "ukrainian",
    "urdu",
    "uyghur",
    "vietnamese",
    "vietnamese-vtb"
  ],
  "notes": "All files were extracted from uonlp/trankit so that downstream users can download ready-to-use weights without zip archives."
}