-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathproper.prm
128 lines (112 loc) · 3.46 KB
/
proper.prm
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
# Evaluation parameter file, based on COLLINS.prm distributed with EVALB
##-------------------------------------------##
## Debug mode ##
## 0: No debugging ##
## 1: print data for individual sentence ##
##-------------------------------------------##
DEBUG 0
##-------------------------------------------##
## MAX error ##
## Number of errors at which to stop the ##
## process. This is useful if there could ##
## be tokenization errors. ##
## The process will stop once this number ##
## of errors has accumulated. ##
##-------------------------------------------##
MAX_ERROR 10
##-------------------------------------------##
## Cut-off length for statistics ##
## At the end of evaluation, the ##
## statistics for the sentences of length ##
## less than or equal to this number will ##
## be shown, in addition to the statistics ##
## for all the sentences. ##
##-------------------------------------------##
CUTOFF_LEN 40
##-------------------------------------------##
## unlabeled or labeled bracketing ##
## 0: unlabeled bracketing ##
## 1: labeled bracketing ##
##-------------------------------------------##
LABELED 1
##-------------------------------------------##
## Delete labels ##
## list of labels to be ignored. ##
## If it is a pre-terminal label, delete ##
## the word along with the brackets. ##
## If it is a non-terminal label, just ##
## delete the brackets (don't delete ##
## children). ##
##-------------------------------------------##
# Sentences for which parsing failed may be marked with a 'NOPARSE' constituent;
# we ignore this label because it is not intended as an actual bracketing.
DELETE_LABEL NOPARSE
# Delete root node labels (TOP, ROOT and VROOT spellings are all listed)
DELETE_LABEL TOP
DELETE_LABEL ROOT
DELETE_LABEL VROOT
# Punctuation
# NB: contrary to COLLINS.prm, ignore ALL punctuation (including brackets)
# Negra / Tiger
DELETE_LABEL $,
DELETE_LABEL $(
DELETE_LABEL $[
DELETE_LABEL $.
# Alpino (upper- and lower-case spellings, with and without bracket suffixes)
DELETE_LABEL PUNCT
DELETE_LABEL punct
DELETE_LABEL LET[]
DELETE_LABEL LET()
DELETE_LABEL LET
DELETE_LABEL let[]
DELETE_LABEL let()
DELETE_LABEL let
# PTB
DELETE_LABEL ,
DELETE_LABEL :
DELETE_LABEL ``
DELETE_LABEL ''
DELETE_LABEL .
# NOTE(review): -NONE- is listed under the punctuation heading but is presumably
# the PTB tag for empty elements rather than a punctuation tag -- confirm.
DELETE_LABEL -NONE-
# Treebank independent, match punctuation by word
# Single-character punctuation tokens.
DELETE_WORD .
DELETE_WORD ,
DELETE_WORD :
DELETE_WORD ;
DELETE_WORD '
DELETE_WORD `
DELETE_WORD "
DELETE_WORD ``
DELETE_WORD ''
DELETE_WORD -
DELETE_WORD (
DELETE_WORD )
DELETE_WORD /
DELETE_WORD &
DELETE_WORD $
# Repeated exclamation marks: one, two and three, mirroring the
# '?', '??', '???' series below. (The two-mark entry was previously
# missing because '!!!' was listed twice.)
DELETE_WORD !
DELETE_WORD !!
DELETE_WORD !!!
# Repeated question marks.
DELETE_WORD ?
DELETE_WORD ??
DELETE_WORD ???
# Two- and three-dot ellipses.
DELETE_WORD ..
DELETE_WORD ...
# Guillemets.
DELETE_WORD «
DELETE_WORD »
##------------------------------------------##
## Delete labels for length calculation ##
## list of labels to be ignored for ##
## length calculation purpose ##
##------------------------------------------##
#DELETE_LABEL_FOR_LENGTH -NONE-
##------------------------------------------##
## Equivalent labels, words ##
## the pairs are considered equivalent ##
## This is non-directional. ##
##------------------------------------------##
# Treat the labels ADVP and PRT as equivalent.
EQ_LABEL ADVP PRT
# Treat the escaped bracket tokens -LRB- / -RRB- as equivalent to literal ( and ).
EQ_WORD -LRB- (
EQ_WORD -RRB- )
# Whether to evaluate only on discontinuous constituents:
# NOTE(review): presumably 0 = evaluate all constituents, 1 = discontinuous only -- confirm.
DISC_ONLY 0