---
# Version string declared for this configuration.
version: "0.8.0"

# Filesystem locations: training corpus, CRF feature template,
# GROBID home directory and temporary working directory.
corpusPath: "./resources/dataset/dataseer/corpus"
templatePath: "./resources/dataset/dataseer/crfpp-templates/dataseer.template"
grobidHome: "/opt/grobid/grobid-home"
tmpPath: "/opt/grobid/grobid-home/tmp/"

# Location of the Pub2TEI installation.
pub2teiPath: "/opt/Pub2TEI/"

# Glutton service endpoint. Deliberately left unset: the bare `key:` form
# already parsed as null, so writing `null` keeps the value and makes the
# intent explicit.
gluttonHost: null
gluttonPort: null

# entity-fishing service endpoint.
# NOTE(review): port 443 suggests the service is reached over HTTPS - confirm.
entityFishingHost: cloud.science-miner.com/nerd
entityFishingPort: 443

# NOTE(review): presumably switches between per-context binary classifiers
# and a single combined classifier - confirm against the consuming code.
useBinaryContextClassifiers: false

# Model definitions. Each entry names a model, selects its engine, and
# carries the engine-specific parameter mapping(s).
models:
  - name: "dataseer"
    engine: "wapiti"
    wapiti:
      epsilon: 0.00001
      window: 20
      nbMaxIterations: 2000

  - name: "dataseer-binary"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "allenai/scibert_scivocab_cased"

  - name: "dataseer-first"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "allenai/scibert_scivocab_cased"

  - name: "dataseer-reuse"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "allenai/scibert_scivocab_cased"

  # This entry selects the "delft" engine but also keeps a `wapiti` mapping.
  # NOTE(review): presumably retained so the engine can be switched back
  # without re-entering the parameters - confirm.
  - name: "datasets"
    engine: "delft"
    wapiti:
      epsilon: 0.00001
      window: 20
      nbMaxIterations: 2000
    delft:
      architecture: "BERT_CRF"
      transformer: "michiyasunaga/LinkBERT-basecased"
      # NOTE(review): `runtime` is nested under `delft` on the assumption
      # that it holds DeLFT prediction-time settings - confirm against the
      # configuration schema.
      runtime:
        max_sequence_length: 200
        batch_size: 20

  - name: "context"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "michiyasunaga/LinkBERT-basecased"

  - name: "context_used"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "michiyasunaga/LinkBERT-basecased"

  - name: "context_creation"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "michiyasunaga/LinkBERT-basecased"

  - name: "context_shared"
    engine: "delft"
    delft:
      architecture: "bert"
      transformer: "michiyasunaga/LinkBERT-basecased"

# Cap on concurrently processed requests.
# NOTE(review): 0 presumably means "no limit" - confirm against the service.
maxParallelRequests: 0

# CORS settings. Origins is the "*" wildcard, kept quoted because a bare `*`
# is the YAML alias sigil.
corsAllowedOrigins: "*"
corsAllowedMethods: "OPTIONS,GET,PUT,POST,DELETE,HEAD"
corsAllowedHeaders: "X-Requested-With,Content-Type,Accept,Origin"

# HTTP server settings: application traffic on port 8060, admin on port 8061.
server:
  type: custom
  idleTimeout: 120 seconds
  applicationConnectors:
    - type: http
      port: 8060
  adminConnectors:
    - type: http
      port: 8061
  registerDefaultExceptionMappers: false
  maxThreads: 2048
  maxQueuedRequests: 2048
  acceptQueueSize: 2048
  # Empty appender list: no request-log appender is configured.
  requestLog:
    appenders: []

# Logging: INFO by default, with three named loggers set to "OFF".
logging:
  level: INFO
  loggers:
    # "OFF" stays quoted so it is read as a string level name, not as a
    # YAML 1.1 boolean.
    org.apache.pdfbox.pdmodel.font.PDSimpleFont: "OFF"
    org.glassfish.jersey.internal: "OFF"
    com.squarespace.jersey2.guice.JerseyGuiceUtils: "OFF"
  appenders:
    - type: console
      threshold: INFO
      timeZone: UTC