Skip to content

Commit

Permalink
update eval
Browse files Browse the repository at this point in the history
  • Loading branch information
rayguan97 committed Nov 16, 2023
1 parent d0114ff commit 3733d9c
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion evaluation.py
Original file line number Diff line number Diff line change
Expand Up @@ -128,7 +128,7 @@ def generate_answer(data, model_output_entry):

print("##### Leaderboard Stats #####")

- table = [["", "Acc per question pair", "Acc per figure", "Acc per easy question", "Acc per hard question", "Acc per question"],
+ table = [["", "Acc per question pair (qAcc)", "Acc per figure (fAcc)", "Acc per easy question (easy aAcc)", "Acc per hard question (hard aAcc)", "Acc per question (aAcc)"],
["GPT Eval", pair_acc_gpt, figure_acc_gpt, easy_acc_gpt, hard_acc_gpt, q_acc_gpt]]
leaderboard = PrettyTable(table[0])
leaderboard.add_rows(table[1:])
Expand Down
2 changes: 1 addition & 1 deletion gpt4v_benchmark.py
Original file line number Diff line number Diff line change
Expand Up @@ -232,7 +232,7 @@ def generate_answer(data, model_output_entry):

print("##### Leaderboard Stats #####")

- table = [["", "Acc per question pair", "Acc per figure", "Acc per easy question", "Acc per hard question", "Acc per question"],
+ table = [["", "Acc per question pair (qAcc)", "Acc per figure (fAcc)", "Acc per easy question (easy aAcc)", "Acc per hard question (hard aAcc)", "Acc per question (aAcc)"],
["Human Eval", pair_acc_human, figure_acc_human, easy_acc_human, hard_acc_human, q_acc_human],
["GPT Eval", pair_acc_gpt, figure_acc_gpt, easy_acc_gpt, hard_acc_gpt, q_acc_gpt]]
leaderboard = PrettyTable(table[0])
Expand Down

0 comments on commit 3733d9c

Please sign in to comment.