Skip to content

Commit

Permalink
[Fix] import issues of multilingual llava and olympiadbench
Browse files: browse the repository at this point in the history
  • Loading branch information
Luodian committed May 27, 2024
1 parent 4c5a99e commit 616edf4
Show file tree
Hide file tree
Showing 15 changed files with 111 additions and 448 deletions.
Original file line number Diff line number Diff line change
@@ -0,0 +1,35 @@
# Shared defaults for the multilingual LLaVA-in-the-wild tasks: evaluation
# split, generation settings, result processing and GPT-scored metrics.
# Presumably this is the `_default_template.yaml` that the per-language task
# files pull in via `include` - TODO confirm the file name.
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

This file was deleted.

Original file line number Diff line number Diff line change
@@ -1,42 +1,6 @@

# Self-contained task config for the `arabic` config of the multilingual
# LLaVA bench (the form that spells out every setting inline).
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: arabic
  token: true
task: "llava_in_the_wild_arabic"
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

# Arabic task stub: only the dataset selection and task name live here; the
# remaining settings are expected to come from the included template.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: arabic
  token: true
task: "llava_in_the_wild_arabic"
include: _default_template.yaml
Original file line number Diff line number Diff line change
@@ -1,42 +1,6 @@

# Self-contained task config for the `bengali` config of the multilingual
# LLaVA bench (the form that spells out every setting inline).
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: bengali
  token: true
task: "llava_in_the_wild_bengali"
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

# Bengali task stub: only the dataset selection and task name live here; the
# remaining settings are expected to come from the included template.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: bengali
  token: true
task: "llava_in_the_wild_bengali"
include: _default_template.yaml
Original file line number Diff line number Diff line change
@@ -1,42 +1,6 @@

# Self-contained task config for the `chinese` config of the multilingual
# LLaVA bench (the form that spells out every setting inline).
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: chinese
  token: true
task: "llava_in_the_wild_chinese"
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

# Chinese task stub: only the dataset selection and task name live here; the
# remaining settings are expected to come from the included template.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: chinese
  token: true
task: "llava_in_the_wild_chinese"
include: _default_template.yaml
Original file line number Diff line number Diff line change
@@ -1,42 +1,6 @@

# Self-contained task config for the `french` config of the multilingual
# LLaVA bench (the form that spells out every setting inline).
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: french
  token: true
task: "llava_in_the_wild_french"
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

# French task stub: only the dataset selection and task name live here; the
# remaining settings are expected to come from the included template.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: french
  token: true
task: "llava_in_the_wild_french"
include: _default_template.yaml
Original file line number Diff line number Diff line change
@@ -1,42 +1,6 @@

# Self-contained task config for the `hindi` config of the multilingual
# LLaVA bench (the form that spells out every setting inline).
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: hindi
  token: true
task: "llava_in_the_wild_hindi"
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

# Hindi task stub: only the dataset selection and task name live here; the
# remaining settings are expected to come from the included template.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: hindi
  token: true
task: "llava_in_the_wild_hindi"
include: _default_template.yaml
Original file line number Diff line number Diff line change
@@ -1,42 +1,6 @@

# Self-contained task config for the `japanese` config of the multilingual
# LLaVA bench (the form that spells out every setting inline).
# NOTE(review): nesting was rebuilt from a copy whose indentation had been
# flattened; confirm child keys against the repository.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: japanese
  token: true
task: "llava_in_the_wild_japanese"
test_split: train
output_type: generate_until
doc_to_visual: !function utils.llava_doc_to_visual
doc_to_text: !function utils.llava_doc_to_text
doc_to_target: "gpt_answer"
generation_kwargs:
  # Stop sequences for generation.
  until:
    - "ASSISTANT:"
  image_aspect_ratio: original
  max_new_tokens: 1024
  temperature: 0
  top_p: 0
  num_beams: 1
  do_sample: false
process_results: !function utils.llava_process_results
# One entry per reported score; each names its own aggregation function.
metric_list:
  - metric: gpt_eval_llava_all
    aggregation: !function utils.llava_all_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_conv
    aggregation: !function utils.llava_conv_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_detail
    aggregation: !function utils.llava_detail_aggregation
    higher_is_better: true
  - metric: gpt_eval_llava_complex
    aggregation: !function utils.llava_complex_aggregation
    higher_is_better: true
metadata:
  version: 0.0
  gpt_eval_model_name: "gpt-4-0613"
model_specific_prompt_kwargs:
  default:
    pre_prompt: ""
    post_prompt: ""

# Japanese task stub: only the dataset selection and task name live here; the
# remaining settings are expected to come from the included template.
dataset_path: "gagan3012/multilingual-llava-bench"
dataset_kwargs:
  config: japanese
  token: true
task: "llava_in_the_wild_japanese"
include: _default_template.yaml
Loading

0 comments on commit 616edf4

Please sign in to comment.