Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -448,6 +448,19 @@ def get_baseline_df_long():
|
|
| 448 |
df = convert_scores_to_percentage(df)
|
| 449 |
return df
|
| 450 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 451 |
def get_all_df(selected_columns, dir=CSV_DIR):
|
| 452 |
submission_repo = Repository(local_dir=SUBMISSION_NAME, clone_from=SUBMISSION_URL, use_auth_token=HF_TOKEN, repo_type="dataset")
|
| 453 |
submission_repo.git_pull()
|
|
@@ -480,6 +493,14 @@ def get_all_df_long(selected_columns, dir=LONG_DIR):
|
|
| 480 |
df = df.sort_values(by="Selected Score", ascending=False)
|
| 481 |
return df
|
| 482 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 483 |
|
| 484 |
def convert_scores_to_percentage(df):
|
| 485 |
# Operate on every column in the DataFrame (except the 'name' column)
|
|
@@ -608,6 +629,34 @@ def on_filter_model_size_method_change_long(selected_columns, vbench_team_sample
|
|
| 608 |
)
|
| 609 |
return filter_component#.value
|
| 610 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 611 |
block = gr.Blocks()
|
| 612 |
|
| 613 |
|
|
@@ -617,7 +666,7 @@ with block:
|
|
| 617 |
)
|
| 618 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
| 619 |
# Table 0
|
| 620 |
-
with gr.TabItem("π VBench", elem_id="vbench-tab-table", id=1):
|
| 621 |
with gr.Row():
|
| 622 |
with gr.Accordion("Citation", open=False):
|
| 623 |
citation_button = gr.Textbox(
|
|
@@ -673,8 +722,47 @@ with block:
|
|
| 673 |
checkbox_group.change(fn=on_filter_model_size_method_change, inputs=[ checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
| 674 |
vbench_team_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
| 675 |
vbench_validate_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
| 676 |
-
#
|
| 677 |
-
with gr.TabItem("
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 678 |
with gr.Accordion("INSTRUCTION", open=False):
|
| 679 |
citation_button = gr.Textbox(
|
| 680 |
value=QUALITY_CLAIM_TEXT,
|
|
@@ -705,7 +793,7 @@ with block:
|
|
| 705 |
checkbox_group_quality.change(fn=on_filter_model_size_method_change_quality, inputs=[checkbox_group_quality], outputs=data_component_quality)
|
| 706 |
|
| 707 |
# Table i2v
|
| 708 |
-
with gr.TabItem("VBench-I2V", elem_id="vbench-tab-table", id=
|
| 709 |
with gr.Accordion("NOTE", open=False):
|
| 710 |
i2v_note_button = gr.Textbox(
|
| 711 |
value=I2V_CLAIM_TEXT,
|
|
@@ -747,7 +835,7 @@ with block:
|
|
| 747 |
vbench_team_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
| 748 |
vbench_validate_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
| 749 |
|
| 750 |
-
with gr.TabItem("π VBench-Long", elem_id="vbench-tab-table", id=
|
| 751 |
with gr.Row():
|
| 752 |
with gr.Accordion("INSTRUCTION", open=False):
|
| 753 |
citation_button = gr.Textbox(
|
|
@@ -805,11 +893,11 @@ with block:
|
|
| 805 |
vbench_validate_filter_long.change(fn=on_filter_model_size_method_change_long, inputs=[checkbox_group_long, vbench_team_filter_long,vbench_validate_filter_long], outputs=data_component)
|
| 806 |
|
| 807 |
# table info
|
| 808 |
-
with gr.TabItem("π About", elem_id="mvbench-tab-table", id=
|
| 809 |
gr.Markdown(LEADERBORAD_INFO, elem_classes="markdown-text")
|
| 810 |
|
| 811 |
# table submission
|
| 812 |
-
with gr.TabItem("π [T2V]Submit here! ", elem_id="mvbench-tab-table", id=
|
| 813 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
| 814 |
|
| 815 |
with gr.Row():
|
|
@@ -881,7 +969,7 @@ with block:
|
|
| 881 |
outputs=[submit_button, submit_succ_button, fail_textbox]
|
| 882 |
)
|
| 883 |
|
| 884 |
-
with gr.TabItem("π [I2V]Submit here! ", elem_id="mvbench-i2v-tab-table", id=
|
| 885 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
| 886 |
|
| 887 |
with gr.Row():
|
|
@@ -965,4 +1053,4 @@ with block:
|
|
| 965 |
data_run.click(on_filter_model_size_method_change, inputs=[checkbox_group], outputs=data_component)
|
| 966 |
|
| 967 |
|
| 968 |
-
block.launch()
|
|
|
|
| 448 |
df = convert_scores_to_percentage(df)
|
| 449 |
return df
|
| 450 |
|
| 451 |
+
def get_baseline_df_2():
    """Build the table shown when the VBench 2.0 tab first loads.

    Syncs the local clone of the submission dataset, reads the CSV at
    ``VBENCH2_DIR``, keeps only rows evaluated by the VBench Team (so the
    initial table agrees with the tab's default-checked "Evaluated by VBench
    Team" checkbox), restricts the frame to ``COLUMN_NAMES_2`` and passes it
    through ``convert_scores_to_percentage``.

    Returns:
        pandas.DataFrame: the rows and columns displayed by default.
    """
    # Pull the latest submissions so the CSV read below is up to date.
    submission_repo = Repository(
        local_dir=SUBMISSION_NAME,
        clone_from=SUBMISSION_URL,
        use_auth_token=HF_TOKEN,
        repo_type="dataset",
    )
    submission_repo.git_pull()

    df = pd.read_csv(VBENCH2_DIR)

    # Display only the results evaluated by the VBench Team by default.
    # Filter before the column selection so this works whether or not
    # "Evaluated by" is one of the displayed columns.
    df = df[df["Evaluated by"] == "VBench Team"]

    df = df[COLUMN_NAMES_2]
    df = convert_scores_to_percentage(df)
    return df
|
| 463 |
+
|
| 464 |
def get_all_df(selected_columns, dir=CSV_DIR):
|
| 465 |
submission_repo = Repository(local_dir=SUBMISSION_NAME, clone_from=SUBMISSION_URL, use_auth_token=HF_TOKEN, repo_type="dataset")
|
| 466 |
submission_repo.git_pull()
|
|
|
|
| 493 |
df = df.sort_values(by="Selected Score", ascending=False)
|
| 494 |
return df
|
| 495 |
|
| 496 |
+
def get_all_df2(dir=VBENCH2_DIR):
    """Return the raw VBench 2.0 results table.

    Syncs the local clone of the submission dataset and reads the CSV at
    ``dir`` as-is; no scoring, sorting or column selection is applied here.

    Args:
        dir: path of the CSV file to read (defaults to ``VBENCH2_DIR``).

    Returns:
        pandas.DataFrame: the unmodified contents of the CSV.
    """
    # Refresh the local checkout before reading from it.
    repo = Repository(
        local_dir=SUBMISSION_NAME,
        clone_from=SUBMISSION_URL,
        use_auth_token=HF_TOKEN,
        repo_type="dataset",
    )
    repo.git_pull()
    return pd.read_csv(dir)
|
| 503 |
+
|
| 504 |
|
| 505 |
def convert_scores_to_percentage(df):
|
| 506 |
# Operate on every column in the DataFrame (except the 'name' column)
|
|
|
|
| 629 |
)
|
| 630 |
return filter_component#.value
|
| 631 |
|
| 632 |
+
|
| 633 |
+
def on_filter_model_size_method_change_2(vbench_team_sample, vbench_team_eval=False):
    """Rebuild the VBench 2.0 leaderboard table for the current filter state.

    Args:
        vbench_team_sample: when truthy, keep only rows whose "Sampled by"
            value is 'VBench Team'.
        vbench_team_eval: when truthy, keep only rows whose "Evaluated by"
            value is 'VBench Team'.

    Returns:
        gr.components.Dataframe: a non-interactive, visible table holding the
        filtered rows restricted to ``COLUMN_NAMES_2``.
    """
    # Load the VBench 2.0 CSV with its dedicated loader. get_all_df() is the
    # wrong function here: its first positional parameter is
    # `selected_columns` and its data path defaults to CSV_DIR.
    updated_data = get_all_df2(VBENCH2_DIR)

    if vbench_team_sample:
        updated_data = updated_data[updated_data["Sampled by"] == 'VBench Team']
    if vbench_team_eval:
        updated_data = updated_data[updated_data['Evaluated by'] == 'VBench Team']

    # Keep the same columns as the declared headers/datatypes. Done after
    # filtering so the filter columns need not be part of COLUMN_NAMES_2.
    updated_data = updated_data[COLUMN_NAMES_2]
    # NOTE(review): get_baseline_df_2 also runs convert_scores_to_percentage
    # on the initial table; confirm whether the refreshed table should too.

    return gr.components.Dataframe(
        value=updated_data,
        headers=COLUMN_NAMES_2,
        type="pandas",
        datatype=VBENCH2_TITLE_TYPE,
        interactive=False,
        visible=True,
    )
|
| 659 |
+
|
| 660 |
block = gr.Blocks()
|
| 661 |
|
| 662 |
|
|
|
|
| 666 |
)
|
| 667 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
| 668 |
# Table 0
|
| 669 |
+
with gr.TabItem("π VBench 1.0", elem_id="vbench-tab-table", id=1):
|
| 670 |
with gr.Row():
|
| 671 |
with gr.Accordion("Citation", open=False):
|
| 672 |
citation_button = gr.Textbox(
|
|
|
|
| 722 |
checkbox_group.change(fn=on_filter_model_size_method_change, inputs=[ checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
| 723 |
vbench_team_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
| 724 |
vbench_validate_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
| 725 |
+
# VBench 2.0
|
| 726 |
+
with gr.TabItem("β VBench 2.0", elem_id="vbench-tab-table", id=2):
    # Collapsible citation box at the top of the tab.
    with gr.Row():
        with gr.Accordion("Citation", open=False):
            citation_button2 = gr.Textbox(
                value=CITATION_BUTTON_TEXT,
                label=CITATION_BUTTON_LABEL,
                elem_id="citation-button",
                lines=14,
            )

    gr.Markdown(
        TABLE_INTRODUCTION
    )

    # Row filters for this tab's table.
    with gr.Row():
        with gr.Column():
            vbench_team_filter_2 = gr.Checkbox(
                label="Sampled by VBench Team (Uncheck to view all submissions)",
                value=False,
                interactive=True
            )
            vbench_validate_filter_2 = gr.Checkbox(
                label="Evaluated by VBench Team (Uncheck to view all submissions)",
                value=True,
                interactive=True
            )

    # The callable passed as `value` supplies the initial table contents.
    data_component_2 = gr.components.Dataframe(
        value=get_baseline_df_2,
        headers=COLUMN_NAMES_2,
        type="pandas",
        datatype=VBENCH2_TITLE_TYPE,
        interactive=False,
        visible=True,
        height=700,
    )

    # Bind the refresh callback to THIS tab's checkboxes (the `_2` ones) and
    # feed it their state. Binding to the VBench 1.0 checkboxes would leave
    # these two controls without any effect.
    vbench_team_filter_2.change(fn=on_filter_model_size_method_change_2, inputs=[vbench_team_filter_2, vbench_validate_filter_2], outputs=data_component_2)
    vbench_validate_filter_2.change(fn=on_filter_model_size_method_change_2, inputs=[vbench_team_filter_2, vbench_validate_filter_2], outputs=data_component_2)
|
| 764 |
+
|
| 765 |
+
with gr.TabItem("Video Quality", elem_id="vbench-tab-table", id=3):
|
| 766 |
with gr.Accordion("INSTRUCTION", open=False):
|
| 767 |
citation_button = gr.Textbox(
|
| 768 |
value=QUALITY_CLAIM_TEXT,
|
|
|
|
| 793 |
checkbox_group_quality.change(fn=on_filter_model_size_method_change_quality, inputs=[checkbox_group_quality], outputs=data_component_quality)
|
| 794 |
|
| 795 |
# Table i2v
|
| 796 |
+
with gr.TabItem("VBench-I2V", elem_id="vbench-tab-table", id=4):
|
| 797 |
with gr.Accordion("NOTE", open=False):
|
| 798 |
i2v_note_button = gr.Textbox(
|
| 799 |
value=I2V_CLAIM_TEXT,
|
|
|
|
| 835 |
vbench_team_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
| 836 |
vbench_validate_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
| 837 |
|
| 838 |
+
with gr.TabItem("π VBench-Long", elem_id="vbench-tab-table", id=5):
|
| 839 |
with gr.Row():
|
| 840 |
with gr.Accordion("INSTRUCTION", open=False):
|
| 841 |
citation_button = gr.Textbox(
|
|
|
|
| 893 |
vbench_validate_filter_long.change(fn=on_filter_model_size_method_change_long, inputs=[checkbox_group_long, vbench_team_filter_long,vbench_validate_filter_long], outputs=data_component)
|
| 894 |
|
| 895 |
# table info
|
| 896 |
+
with gr.TabItem("π About", elem_id="mvbench-tab-table", id=6):
|
| 897 |
gr.Markdown(LEADERBORAD_INFO, elem_classes="markdown-text")
|
| 898 |
|
| 899 |
# table submission
|
| 900 |
+
with gr.TabItem("π [T2V]Submit here! ", elem_id="mvbench-tab-table", id=7):
|
| 901 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
| 902 |
|
| 903 |
with gr.Row():
|
|
|
|
| 969 |
outputs=[submit_button, submit_succ_button, fail_textbox]
|
| 970 |
)
|
| 971 |
|
| 972 |
+
with gr.TabItem("π [I2V]Submit here! ", elem_id="mvbench-i2v-tab-table", id=8):
|
| 973 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
| 974 |
|
| 975 |
with gr.Row():
|
|
|
|
| 1053 |
data_run.click(on_filter_model_size_method_change, inputs=[checkbox_group], outputs=data_component)
|
| 1054 |
|
| 1055 |
|
| 1056 |
+
block.launch()
|