Comment out Spice in caption tasks so that users don't need to download stan… · EvolvingLMMs-Lab/lmms-eval@b2b4dbd (original) (raw)
7 files changed
lines changed
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -43,7 +43,7 @@ def coco_process_result(doc, result): | ||
43 | 43 | |
44 | 44 | |
45 | 45 | def coco_aggregation_result(results, metric, args): |
46 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
46 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
47 | 47 | scorers_dict = {s[1]: s for s in scorers} |
48 | 48 | |
49 | 49 | stored_results = [] |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -41,7 +41,7 @@ def flickr_process_result(doc, result): | ||
41 | 41 | |
42 | 42 | |
43 | 43 | def flickr_aggregation_result(results, metric, args): |
44 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
44 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
45 | 45 | scorers_dict = {s[1]: s for s in scorers} |
46 | 46 | |
47 | 47 | stored_results = [] |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -42,7 +42,7 @@ def nocaps_process_result(doc, result): | ||
42 | 42 | |
43 | 43 | |
44 | 44 | def nocaps_aggregation_result(results, metric, args=None): |
45 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
45 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
46 | 46 | scorers_dict = {s[1]: s for s in scorers} |
47 | 47 | |
48 | 48 | stored_results = [] |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -49,7 +49,7 @@ def refcoco_process_result(doc, result): | ||
49 | 49 | |
50 | 50 | |
51 | 51 | def refcoco_aggregation_result(results, metric): |
52 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
52 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
53 | 53 | scorers_dict = {s[1]: s for s in scorers} |
54 | 54 | |
55 | 55 | stored_results = [] |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -49,7 +49,7 @@ def refcoco_process_result(doc, result): | ||
49 | 49 | |
50 | 50 | |
51 | 51 | def refcoco_aggregation_result(results, metric): |
52 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
52 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
53 | 53 | scorers_dict = {s[1]: s for s in scorers} |
54 | 54 | |
55 | 55 | stored_results = [] |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -49,7 +49,7 @@ def refcoco_process_result(doc, result): | ||
49 | 49 | |
50 | 50 | |
51 | 51 | def refcoco_aggregation_result(results, metric): |
52 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
52 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
53 | 53 | scorers_dict = {s[1]: s for s in scorers} |
54 | 54 | |
55 | 55 | stored_results = [] |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -38,7 +38,7 @@ def textcaps_process_result(doc, result): | ||
38 | 38 | |
39 | 39 | |
40 | 40 | def textcaps_aggregation_result(results, metric, args=None): |
41 | -scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr"), (Spice(), "SPICE")] | |
41 | +scorers = [(Bleu(4), "Bleu_1"), (Bleu(4), "Bleu_2"), (Bleu(4), "Bleu_3"), (Bleu(4), "Bleu_4"), (Meteor(), "METEOR"), (Rouge(), "ROUGE_L"), (Cider(), "CIDEr")]#, (Spice(), "SPICE")] | |
42 | 42 | scorers_dict = {s[1]: s for s in scorers} |
43 | 43 | |
44 | 44 | stored_results = [] |