merge model_specific_prompt_kwargs and dataset_name into each task yaml · EvolvingLMMs-Lab/lmms-eval@0581ab3 (original) (raw)
18 files changed
lines changed
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,9 +1,5 @@ | ||
1 | 1 | dataset_path: MM-UPD/MM-UPD |
2 | 2 | doc_to_target: "answer" |
3 | -model_specific_prompt_kwargs: | |
4 | -  default: | |
5 | -    pre_prompt: "" | |
6 | -    post_prompt: "\n" | |
7 | 3 | doc_to_visual: !function utils.mmupd_doc_to_visual |
8 | 4 | doc_to_text: !function utils.mmupd_doc_to_text |
9 | 5 | doc_to_target: "answer" |
@@ -12,7 +8,6 @@ model_specific_generation_kwargs: | ||
12 | 8 |   llava: |
13 | 9 |     image_aspect_ratio: original |
14 | 10 | output_type: generate_until |
15 | -dataset_name: mmaad_base | |
16 | 11 | generation_kwargs: |
17 | 12 |   until: |
18 | 13 |     - "ASSISTANT:" |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmaad_base" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmaad_base_yaml | |
3 | +dataset_name: mmaad_base | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\n" | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmaad_base |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmaad_instruction" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmaad_instruction_yaml | |
3 | +dataset_name: mmaad_base | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\nIf all the options are incorrect, answer \"F. None of the above\"." | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmaad_instruction |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmaad_option" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmaad_option_yaml | |
3 | +dataset_name: mmaad_option | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\nAnswer with the option's letter from the given choices directly." | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmaad_option |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmiasd_base" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmiasd_base_yaml | |
3 | +dataset_name: mmiasd_base | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\n" | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmiasd_base |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmiasd_instruction" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmiasd_instruction_yaml | |
3 | +dataset_name: mmiasd_base | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\nIf all the options are incorrect, answer \"F. None of the above\"." | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmiasd_instruction |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmiasd_option" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmiasd_option_yaml | |
3 | +dataset_name: mmiasd_option | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\nAnswer with the option's letter from the given choices directly." | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmiasd_option |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmivqd_base" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmivqd_base_yaml | |
3 | +dataset_name: mmivqd_base | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\n" | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmivqd_base |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmivqd_instruction" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmivqd_instruction_yaml | |
3 | +dataset_name: mmivqd_base | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\nIf the given image is irrelevant to the question, answer \"F. The image and question are irrelevant.\"." | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmivqd_instruction |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,6 +1,11 @@ | ||
1 | 1 | task: "mmivqd_option" |
2 | 2 | test_split: test |
3 | -include: _default_template_mmivqd_option_yaml | |
3 | +dataset_name: mmivqd_option | |
4 | +model_specific_prompt_kwargs: | |
5 | +  default: | |
6 | +    pre_prompt: "" | |
7 | +    post_prompt: "\nAnswer with the option's letter from the given choices directly." | |
8 | +include: _default_template_mmupd_yaml | |
4 | 9 | metric_list: |
5 | 10 |   - metric: gpt_eval_score |
6 | 11 |     aggregation: !function utils.mmivqd_option |