-
Notifications
You must be signed in to change notification settings - Fork 16
/
cocoeval.py
138 lines (124 loc) · 5.59 KB
/
cocoeval.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
from pycocoevalcap.bleu.bleu import Bleu
from pycocoevalcap.rouge.rouge import Rouge
from pycocoevalcap.cider.cider import Cider
from pycocoevalcap.meteor.meteor import Meteor
from pycocoevalcap.tokenizer.ptbtokenizer import PTBTokenizer
import os, cPickle
class COCOScorer(object):
def __init__(self):
print 'init COCO-EVAL scorer'
def score(self, GT, RES, IDs):
self.eval = {}
self.imgToEval = {}
gts = {}
res = {}
for ID in IDs:
gts[ID] = GT[ID]
res[ID] = RES[ID]
print 'tokenization...'
tokenizer = PTBTokenizer()
gts = tokenizer.tokenize(gts)
res = tokenizer.tokenize(res)
# =================================================
# Set up scorers
# =================================================
print 'setting up scorers...'
scorers = [
(Bleu(4), ["Bleu_1", "Bleu_2", "Bleu_3", "Bleu_4"]),
(Meteor(),"METEOR"),
(Rouge(), "ROUGE_L"),
(Cider(), "CIDEr")
]
# =================================================
# Compute scores
# =================================================
eval = {}
for scorer, method in scorers:
print 'computing %s score...'%(scorer.method())
score, scores = scorer.compute_score(gts, res)
if type(method) == list:
for sc, scs, m in zip(score, scores, method):
self.setEval(sc, m)
self.setImgToEvalImgs(scs, IDs, m)
print "%s: %0.3f"%(m, sc)
else:
self.setEval(score, method)
self.setImgToEvalImgs(scores, IDs, method)
print "%s: %0.3f"%(method, score)
for metric, score in self.eval.items():
print '%s: %.3f'%(metric, score)
return self.eval
def setEval(self, score, method):
self.eval[method] = score
def setImgToEvalImgs(self, scores, imgIds, method):
for imgId, score in zip(imgIds, scores):
if not imgId in self.imgToEval:
self.imgToEval[imgId] = {}
self.imgToEval[imgId]["image_id"] = imgId
self.imgToEval[imgId][method] = score
def load_pkl(path):
f = open(path, 'rb')
try:
rval = cPickle.load(f)
finally:
f.close()
return rval
def score(ref, sample):
# ref and sample are both dict
scorers = [
(Bleu(4), ["Bleu_1", "Bleu_2", "Bleu_3", "Bleu_4"]),
(Meteor(),"METEOR"),
(Rouge(), "ROUGE_L"),
(Cider(), "CIDEr")
]
final_scores = {}
for scorer, method in scorers:
print 'computing %s score with COCO-EVAL...'%(scorer.method())
score, scores = scorer.compute_score(ref, sample)
if type(score) == list:
for m, s in zip(method, score):
final_scores[m] = s
else:
final_scores[method] = score
return final_scores
def test_cocoscorer():
'''gts = {
184321:[
{u'image_id': 184321, u'id': 352188, u'caption': u'A train traveling down-tracks next to lights.'},
{u'image_id': 184321, u'id': 356043, u'caption': u"A blue and silver train next to train's station and trees."},
{u'image_id': 184321, u'id': 356382, u'caption': u'A blue train is next to a sidewalk on the rails.'},
{u'image_id': 184321, u'id': 361110, u'caption': u'A passenger train pulls into a train station.'},
{u'image_id': 184321, u'id': 362544, u'caption': u'A train coming down the tracks arriving at a station.'}],
81922: [
{u'image_id': 81922, u'id': 86779, u'caption': u'A large jetliner flying over a traffic filled street.'},
{u'image_id': 81922, u'id': 90172, u'caption': u'An airplane flies low in the sky over a city street. '},
{u'image_id': 81922, u'id': 91615, u'caption': u'An airplane flies over a street with many cars.'},
{u'image_id': 81922, u'id': 92689, u'caption': u'An airplane comes in to land over a road full of cars'},
{u'image_id': 81922, u'id': 823814, u'caption': u'The plane is flying over top of the cars'}]
}
samples = {
184321: [{u'image_id': 184321, 'id': 111, u'caption': u'train traveling down a track in front of a road'}],
81922: [{u'image_id': 81922, 'id': 219, u'caption': u'plane is flying through the sky'}],
}
'''
gts = {
'184321':[
{u'image_id': '184321', u'cap_id': 0, u'caption': u'A train traveling down tracks next to lights.',
'tokenized': 'a train traveling down tracks next to lights'},
{u'image_id': '184321', u'cap_id': 1, u'caption': u'A train coming down the tracks arriving at a station.',
'tokenized': 'a train coming down the tracks arriving at a station'}],
'81922': [
{u'image_id': '81922', u'cap_id': 0, u'caption': u'A large jetliner flying over a traffic filled street.',
'tokenized': 'a large jetliner flying over a traffic filled street'},
{u'image_id': '81922', u'cap_id': 1, u'caption': u'The plane is flying over top of the cars',
'tokenized': 'the plan is flying over top of the cars'},]
}
samples = {
'184321': [{u'image_id': '184321', u'caption': u'train traveling down a track in front of a road'}],
'81922': [{u'image_id': '81922', u'caption': u'plane is flying through the sky'}],
}
IDs = ['184321', '81922']
scorer = COCOScorer()
scorer.score(gts, samples, IDs)
if __name__ == '__main__':
test_cocoscorer()