-
Notifications
You must be signed in to change notification settings - Fork 29
/
evaluate.py
81 lines (58 loc) · 1.79 KB
/
evaluate.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
def normalize_pretag(pretag):
if pretag == "S":
return "B"
elif pretag == "E":
return "I"
return pretag
def preprocess_labels(label_sents):
data = []
for sent in label_sents:
for label in sent:
tokens = label.split("-")
if len(tokens) == 2:
pretag = tokens[0]
tag = tokens[1]
pretag = normalize_pretag(pretag)
elif len(tokens) == 1:
pretag, tag = "O", "O"
else:
continue
data.append((pretag, tag))
return data
def load_file(path):
with open(path, 'r') as fp:
return [l.strip().split() for l in fp.readlines()]
def compute_f1(preds, y):
prec = compute_precision(preds, y)
rec = compute_precision(y, preds)
f1 = 0
if (rec + prec) > 0:
f1 = 2.0 * prec * rec / (prec + rec)
return (prec, rec, f1)
def compute_precision(guessed, correct):
correctCount = 0
count = 0
idx = 0
while idx < len(guessed):
if guessed[idx][0] == 'B': # A new chunk starts
count += 1
if guessed[idx] == correct[idx]:
idx += 1
correctlyFound = True
while idx < len(guessed) and guessed[idx][0] == 'I':
if guessed[idx] != correct[idx]:
correctlyFound = False
idx += 1
if idx < len(guessed):
if correct[idx][0] == 'I':
correctlyFound = False
if correctlyFound:
correctCount += 1
else:
idx += 1
else:
idx += 1
precision = 0
if count > 0:
precision = float(correctCount) / count
return precision