-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig.ini
46 lines (39 loc) · 1.19 KB
/
config.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
# ----------------------- Settings -----------------------------
[Encoding]
# Character encodings used by the tool; both are currently set to UTF-8.
# NOTE(review): presumably file-encoding applies when reading corpus files
# and outfile-encoding when writing results - confirm against the consumer.
file-encoding=utf-8
outfile-encoding=utf-8
[Data]
# Locations of the corpus and of the generated output.
# Both values are relative paths. NOTE(review): what they are resolved
# against (working directory vs. this file's directory) is not stated
# here - confirm against the consumer.
corpus-path=./data
output-path=./output
# ----------- FILE FORMAT RELATED SETTINGS ----------
[Corpus-Format]
# Describes how one corpus line is split into fields and how those fields
# are combined into type / collocate / token identifiers.

# Regular expression for a token line: six tab-separated fields, one capture
# group per field. The second group captures only the FIRST character of the
# second field; the rest of that field is matched by [^\t]* and discarded.
# NOTE(review): with the column names below this means `pos` holds just the
# first character of the POS field - confirm this truncation is intended.
line-machine = ([^\t]+)\t([^\t])[^\t]*\t([^\t]+)\t([^\t]+)\t([^\t]+)\t([^\t]+)
# Names for the six capture groups of line-machine (presumably assigned in
# order - TODO confirm).
global-columns = word,pos,lemma,id,head,deprel
# Templates built from column names joined with "/".
# NOTE(review): `fid` and `lid` in the token template are not listed in
# global-columns; presumably the consumer supplies them (file id / line id?)
# - verify.
type = lemma/pos
colloc = lemma/pos
token = lemma/pos/fid/lid
# Boundary detection mode. `single` is active; `left-right` is kept below as
# a commented-out alternative.
# boundary-detection-mechanism = left-right
boundary-detection-mechanism = single
# Patterns for separator / boundary lines. Both are currently the literal
# closing sentence tag.
# NOTE(review): how the consumer distinguishes separator-line-machine from
# single-boundary-machine is not visible here - confirm.
separator-line-machine = </s>
single-boundary-machine = </s>
# Commented-out alternative that would match any single tag without tabs.
# single-boundary-machine = <[^>\t]+>
# Opening / closing boundary patterns; presumably only consulted when
# boundary-detection-mechanism = left-right (TODO confirm).
# The left pattern captures the quoted attribute value and requires the exact
# spacing shown, including one space between ">" and the end of the line.
left-boundary-machine = ^<artikel naam = "([^"]+)" > $
right-boundary-machine = ^</artikel>$
# Dependency-related settings (only relevant if the corpus has dependency
# info). All values below are column names from global-columns.
node-attr = lemma,pos
edge-attr = deprel
currID = id
headID = head
# ----------- SPAN RELATED SETTINGS -----------
[Span]
# Context window sizes, counted in tokens on each side of the node.

# number of tokens to the left of the node
left-span=4
# number of tokens to the right of the node
right-span=4
# number of tokens to the left of the node for MWU identification
# NOTE(review): MWU presumably means multi-word unit, and 0 presumably
# disables MWU context on this side - confirm against the consumer.
left-MWUspan=0
# number of tokens to the right of the node for MWU identification
right-MWUspan=0
[Special]
# Reserved key name used as the default entry for "wqueries".
# NOTE(review): what wqueries are and where this key is looked up is not
# visible in this file - confirm against the consumer before changing it.
wqueries-default-key = _DEFAULT_
# ----------- FILENAME RELATED SETTINGS (NOT IN USE) -----------