Comment out SPICE in caption tasks so that we don't need to download stan… · EvolvingLMMs-Lab/lmms-eval@b2b4dbd (original) (raw)

7 files changed

lines changed

Original file line number Diff line number Diff line change
@@ -43,7 +43,7 @@ def coco_process_result(doc, result):
43 43
44 44
45 45 def coco_aggregation_result(results, metric, args):
46 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
46 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
47 47 scorers_dict = {s[1]: s for s in scorers}
48 48
49 49 stored_results = []
Original file line number Diff line number Diff line change
@@ -41,7 +41,7 @@ def flickr_process_result(doc, result):
41 41
42 42
43 43 def flickr_aggregation_result(results, metric, args):
44 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
44 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
45 45 scorers_dict = {s[1]: s for s in scorers}
46 46
47 47 stored_results = []
Original file line number Diff line number Diff line change
@@ -42,7 +42,7 @@ def nocaps_process_result(doc, result):
42 42
43 43
44 44 def nocaps_aggregation_result(results, metric, args=None):
45 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
45 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
46 46 scorers_dict = {s[1]: s for s in scorers}
47 47
48 48 stored_results = []
Original file line number Diff line number Diff line change
@@ -49,7 +49,7 @@ def refcoco_process_result(doc, result):
49 49
50 50
51 51 def refcoco_aggregation_result(results, metric):
52 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
52 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
53 53 scorers_dict = {s[1]: s for s in scorers}
54 54
55 55 stored_results = []
Original file line number Diff line number Diff line change
@@ -49,7 +49,7 @@ def refcoco_process_result(doc, result):
49 49
50 50
51 51 def refcoco_aggregation_result(results, metric):
52 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
52 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
53 53 scorers_dict = {s[1]: s for s in scorers}
54 54
55 55 stored_results = []
Original file line number Diff line number Diff line change
@@ -49,7 +49,7 @@ def refcoco_process_result(doc, result):
49 49
50 50
51 51 def refcoco_aggregation_result(results, metric):
52 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
52 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
53 53 scorers_dict = {s[1]: s for s in scorers}
54 54
55 55 stored_results = []
Original file line number Diff line number Diff line change
@@ -38,7 +38,7 @@ def textcaps_process_result(doc, result):
38 38
39 39
40 40 def textcaps_aggregation_result(results, metric, args=None):
41 -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")]
41 +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")]
42 42 scorers_dict = {s[1]: s for s in scorers}
43 43
44 44 stored_results = []