lfoppiano commited on
Commit
e2cd6d9
·
verified ·
1 Parent(s): a45a29f

Upload config-docker.yml

Browse files
Files changed (1) hide show
  1. config-docker.yml +129 -0
config-docker.yml ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ version: "0.8.0"
2
+
3
+ grobidHome: /opt/grobid/grobid-home
4
+
5
+ # entity-fishing server information for performing entity disambiguation
6
+ # for https, indicate 443 as port
7
+ entityFishingHost:
8
+ entityFishingPort:
9
+ #entityFishingHost: localhost
10
+ #entityFishingPort: 8090
11
+
12
+ corpusPath: resources/dataset/
13
+ tmpPath: tmp/
14
+
15
+ # path to Pub2TEI repository as available at https://github.com/kermitt2/Pub2TEI
16
+ pub2teiPath: "../../Pub2TEI/"
17
+
18
+ # if true we use binary classifiers for the contexts, otherwise use a single multi-label classifier
19
+ # binary classifiers perform better, but are heavier to use
20
+ useBinaryContextClassifiers: true
21
+
22
+ models:
23
+ - name: "software"
24
+ engine: "wapiti"
25
+ #engine: "delft"
26
+ wapiti:
27
+ # wapiti training parameters, only considered when wapiti is used as engine for the model,
28
+ # these parameters are used at training time only
29
+ epsilon: 0.00001
30
+ window: 30
31
+ nbMaxIterations: 1500
32
+ delft:
33
+ # deep learning parameters
34
+ #architecture: "BidLSTM_CRF"
35
+ #useELMo: false
36
+ #embeddings_name: "glove-840B"
37
+ architecture: "BERT"
38
+ transformer: "allenai/scibert_scivocab_cased"
39
+ #transformer: "michiyasunaga/LinkBERT-basecased"
40
+
41
+ - name: "software-type"
42
+ engine: "wapiti"
43
+ #engine: "delft"
44
+ wapiti:
45
+ # wapiti training parameters, only considered when wapiti is used as engine for the model,
46
+ # these parameters are used at training time only
47
+ epsilon: 0.00001
48
+ window: 30
49
+ nbMaxIterations: 1500
50
+ delft:
51
+ # deep learning parameters
52
+ #architecture: "BidLSTM_CRF"
53
+ #useELMo: false
54
+ #embeddings_name: "glove-840B"
55
+ architecture: "BERT_CRF"
56
+ transformer: "michiyasunaga/LinkBERT-basecased"
57
+
58
+ - name: "context"
59
+ # multi-label classifier for the context
60
+ engine: "delft"
61
+ delft:
62
+ #architecture: "gru"
63
+ #embeddings_name: "glove-840B"
64
+ architecture: "bert"
65
+ transformer: "michiyasunaga/LinkBERT-basecased"
66
+
67
+ - name: "context_used"
68
+ # binary classifier to predict if the context of the mention corresponds to a usage of the software
69
+ engine: "delft"
70
+ delft:
71
+ #architecture: "gru"
72
+ #embeddings_name: "glove-840B"
73
+ architecture: "bert"
74
+ transformer: "michiyasunaga/LinkBERT-basecased"
75
+
76
+ - name: "context_creation"
77
+ # binary classifier to predict if the context of the mention corresponds to a creation of the software
78
+ engine: "delft"
79
+ delft:
80
+ #architecture: "gru"
81
+ #embeddings_name: "glove-840B"
82
+ architecture: "bert"
83
+ transformer: "michiyasunaga/LinkBERT-basecased"
84
+
85
+ - name: "context_shared"
86
+ # binary classifier to predict if the context of the mention corresponds to a sharing of the software
87
+ engine: "delft"
88
+ delft:
89
+ #architecture: "gru"
90
+ #embeddings_name: "glove-840B"
91
+ architecture: "bert"
92
+ transformer: "michiyasunaga/LinkBERT-basecased"
93
+
94
+ # Limit the maximum number of requests
95
+ maxParallelRequests: 0
96
+
97
+ # CORS configuration for the web API service
98
+ corsAllowedOrigins: "*"
99
+ corsAllowedMethods: "OPTIONS,GET,PUT,POST,DELETE,HEAD"
100
+ corsAllowedHeaders: "X-Requested-With,Content-Type,Accept,Origin"
101
+
102
+ server:
103
+ type: custom
104
+ idleTimeout: 120 seconds
105
+ applicationConnectors:
106
+ - type: http
107
+ port: 8060
108
+ adminConnectors:
109
+ - type: http
110
+ port: 8061
111
+ registerDefaultExceptionMappers: false
112
+ maxThreads: 2048
113
+ maxQueuedRequests: 2048
114
+ acceptQueueSize: 2048
115
+ # change the following for having all http requests logged
116
+ requestLog:
117
+ appenders: []
118
+
119
+ # these logging settings apply to the service usage mode
120
+ logging:
121
+ level: INFO
122
+ loggers:
123
+ org.apache.pdfbox.pdmodel.font.PDSimpleFont: "OFF"
124
+ org.glassfish.jersey.internal: "OFF"
125
+ com.squarespace.jersey2.guice.JerseyGuiceUtils: "OFF"
126
+ appenders:
127
+ - type: console
128
+ threshold: WARN
129
+ timeZone: UTC