datastet-dev

Paused

App Files Community

lfoppiano committed on Apr 21, 2025

Commit

26db885

verified ·

1 Parent(s): baa8dd0

Update config-docker.yml

Browse files

Files changed (1) hide show

config-docker.yml +19 -8

config-docker.yml CHANGED Viewed

@@ -1,4 +1,4 @@
-version: "0.8.0"
 corpusPath: "./resources/dataset/dataseer/corpus"
 templatePath: "./resources/dataset/dataseer/crfpp-templates/dataseer.template"
@@ -8,18 +8,18 @@ tmpPath: "/opt/grobid/grobid-home/tmp/"
 # path to Pub2TEI repository as available at https://github.com/kermitt2/Pub2TEI
 pub2teiPath: "/opt/Pub2TEI/"
-gluttonHost: "https://cloud.science-miner.com/glutton"
 gluttonPort:
 # entity-fishing server information for performing entity disambiguation
 # for https, indicate 443 as port
-entityFishingHost: notanumber.com
 entityFishingPort: 443
 #entityFishingHost: localhost
 #entityFishingPort: 8090
 # if true we use binary classifiers for the contexts, otherwise use a single multi-label classifier
-# binary classifiers perform better, but havier to use
 useBinaryContextClassifiers: false
 # sequence labeling model (identify data-related sections)
@@ -35,7 +35,7 @@ models:
       window: 20
       nbMaxIterations: 2000
-  # classifier model, dataset binary (datset or not dataset in the current sentence)
   - name: "dataseer-binary"
     engine: "delft"
     delft:
@@ -130,17 +130,18 @@ corsAllowedHeaders: "X-Requested-With,Content-Type,Accept,Origin"
 server:
   type: custom
-  idleTimeout: 120 seconds
   applicationConnectors:
     - type: http
       port: 8060
   adminConnectors:
     - type: http
       port: 8061
   registerDefaultExceptionMappers: false
   maxThreads: 2048
   maxQueuedRequests: 2048
-  acceptQueueSize: 2048
   requestLog:
     appenders: []
@@ -157,4 +158,14 @@ logging:
       timeZone: UTC
       # uncomment to have the logs in json format
       #layout:
-      #  type: json

+version: "0.8.1"
 corpusPath: "./resources/dataset/dataseer/corpus"
 templatePath: "./resources/dataset/dataseer/crfpp-templates/dataseer.template"
 # path to Pub2TEI repository as available at https://github.com/kermitt2/Pub2TEI
 pub2teiPath: "/opt/Pub2TEI/"
+gluttonHost:
 gluttonPort:
 # entity-fishing server information for performing entity disambiguation
 # for https, indicate 443 as port
+entityFishingHost: cloud.science-miner.com/nerd
 entityFishingPort: 443
 #entityFishingHost: localhost
 #entityFishingPort: 8090
 # if true we use binary classifiers for the contexts, otherwise use a single multi-label classifier
+# binary classifiers perform better, but heavier to use
 useBinaryContextClassifiers: false
 # sequence labeling model (identify data-related sections)
       window: 20
       nbMaxIterations: 2000
+  # classifier model, dataset binary (dataset or not dataset in the current sentence)
   - name: "dataseer-binary"
     engine: "delft"
     delft:
 server:
   type: custom
   applicationConnectors:
     - type: http
       port: 8060
+      idleTimeout: 120 seconds
+      acceptQueueSize: 2048
   adminConnectors:
     - type: http
       port: 8061
   registerDefaultExceptionMappers: false
   maxThreads: 2048
   maxQueuedRequests: 2048
   requestLog:
     appenders: []
       timeZone: UTC
       # uncomment to have the logs in json format
       #layout:
+      #  type: json
+#    - type: file
+#      currentLogFilename: logs/datastet-service.log
+#      threshold: INFO
+#      archive: true
+#      archivedLogFilenamePattern: logs/datastet-service-%d.log
+#      archivedFileCount: 7
+#      timeZone: UTC
+      # uncomment to have the logs in json format
+      #layout:
+      #  type: json