Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
@@ -448,6 +448,19 @@ def get_baseline_df_long():
|
|
448 |
df = convert_scores_to_percentage(df)
|
449 |
return df
|
450 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
451 |
def get_all_df(selected_columns, dir=CSV_DIR):
|
452 |
submission_repo = Repository(local_dir=SUBMISSION_NAME, clone_from=SUBMISSION_URL, use_auth_token=HF_TOKEN, repo_type="dataset")
|
453 |
submission_repo.git_pull()
|
@@ -480,6 +493,14 @@ def get_all_df_long(selected_columns, dir=LONG_DIR):
|
|
480 |
df = df.sort_values(by="Selected Score", ascending=False)
|
481 |
return df
|
482 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
483 |
|
484 |
def convert_scores_to_percentage(df):
|
485 |
# Operate on every column in the DataFrame (except the 'name' column)
|
@@ -608,6 +629,34 @@ def on_filter_model_size_method_change_long(selected_columns, vbench_team_sample
|
|
608 |
)
|
609 |
return filter_component#.value
|
610 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
611 |
block = gr.Blocks()
|
612 |
|
613 |
|
@@ -617,7 +666,7 @@ with block:
|
|
617 |
)
|
618 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
619 |
# Table 0
|
620 |
-
with gr.TabItem("π VBench", elem_id="vbench-tab-table", id=1):
|
621 |
with gr.Row():
|
622 |
with gr.Accordion("Citation", open=False):
|
623 |
citation_button = gr.Textbox(
|
@@ -673,8 +722,47 @@ with block:
|
|
673 |
checkbox_group.change(fn=on_filter_model_size_method_change, inputs=[ checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
674 |
vbench_team_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
675 |
vbench_validate_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
676 |
-
#
|
677 |
-
with gr.TabItem("
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
678 |
with gr.Accordion("INSTRUCTION", open=False):
|
679 |
citation_button = gr.Textbox(
|
680 |
value=QUALITY_CLAIM_TEXT,
|
@@ -705,7 +793,7 @@ with block:
|
|
705 |
checkbox_group_quality.change(fn=on_filter_model_size_method_change_quality, inputs=[checkbox_group_quality], outputs=data_component_quality)
|
706 |
|
707 |
# Table i2v
|
708 |
-
with gr.TabItem("VBench-I2V", elem_id="vbench-tab-table", id=
|
709 |
with gr.Accordion("NOTE", open=False):
|
710 |
i2v_note_button = gr.Textbox(
|
711 |
value=I2V_CLAIM_TEXT,
|
@@ -747,7 +835,7 @@ with block:
|
|
747 |
vbench_team_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
748 |
vbench_validate_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
749 |
|
750 |
-
with gr.TabItem("π VBench-Long", elem_id="vbench-tab-table", id=
|
751 |
with gr.Row():
|
752 |
with gr.Accordion("INSTRUCTION", open=False):
|
753 |
citation_button = gr.Textbox(
|
@@ -805,11 +893,11 @@ with block:
|
|
805 |
vbench_validate_filter_long.change(fn=on_filter_model_size_method_change_long, inputs=[checkbox_group_long, vbench_team_filter_long,vbench_validate_filter_long], outputs=data_component)
|
806 |
|
807 |
# table info
|
808 |
-
with gr.TabItem("π About", elem_id="mvbench-tab-table", id=
|
809 |
gr.Markdown(LEADERBORAD_INFO, elem_classes="markdown-text")
|
810 |
|
811 |
# table submission
|
812 |
-
with gr.TabItem("π [T2V]Submit here! ", elem_id="mvbench-tab-table", id=
|
813 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
814 |
|
815 |
with gr.Row():
|
@@ -881,7 +969,7 @@ with block:
|
|
881 |
outputs=[submit_button, submit_succ_button, fail_textbox]
|
882 |
)
|
883 |
|
884 |
-
with gr.TabItem("π [I2V]Submit here! ", elem_id="mvbench-i2v-tab-table", id=
|
885 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
886 |
|
887 |
with gr.Row():
|
@@ -965,4 +1053,4 @@ with block:
|
|
965 |
data_run.click(on_filter_model_size_method_change, inputs=[checkbox_group], outputs=data_component)
|
966 |
|
967 |
|
968 |
-
block.launch()
|
|
|
448 |
df = convert_scores_to_percentage(df)
|
449 |
return df
|
450 |
|
451 |
+
def get_baseline_df_2():
    """Build the table initially shown in the VBench 2.0 tab.

    Instantiates the submission ``Repository`` and calls ``git_pull()`` on
    it, reads the CSV at ``VBENCH2_DIR``, keeps only the ``COLUMN_NAMES_2``
    columns, and passes the result through ``convert_scores_to_percentage``.

    Returns:
        Whatever ``convert_scores_to_percentage`` returns for the
        column-restricted DataFrame.
    """
    # Pull before reading; presumably VBENCH2_DIR points inside this
    # checkout -- TODO confirm.
    repo = Repository(
        local_dir=SUBMISSION_NAME,
        clone_from=SUBMISSION_URL,
        use_auth_token=HF_TOKEN,
        repo_type="dataset",
    )
    repo.git_pull()

    # NOTE(review): no "Evaluated by" filter is applied here, so every row of
    # the CSV is shown by default. Confirm whether the default view should be
    # restricted to rows evaluated by the VBench Team.
    leaderboard = pd.read_csv(VBENCH2_DIR)[COLUMN_NAMES_2]
    return convert_scores_to_percentage(leaderboard)
|
463 |
+
|
464 |
def get_all_df(selected_columns, dir=CSV_DIR):
|
465 |
submission_repo = Repository(local_dir=SUBMISSION_NAME, clone_from=SUBMISSION_URL, use_auth_token=HF_TOKEN, repo_type="dataset")
|
466 |
submission_repo.git_pull()
|
|
|
493 |
df = df.sort_values(by="Selected Score", ascending=False)
|
494 |
return df
|
495 |
|
496 |
+
def get_all_df2(dir=VBENCH2_DIR):
    """Return the raw VBench 2.0 results table.

    Instantiates the submission ``Repository``, calls ``git_pull()`` on it,
    and reads the CSV at ``dir`` with ``pd.read_csv``. No column selection,
    sorting, or score conversion is performed here.

    Args:
        dir: Path of the CSV file to read. Defaults to ``VBENCH2_DIR``.

    Returns:
        The DataFrame produced by ``pd.read_csv(dir)``.
    """
    repo = Repository(
        local_dir=SUBMISSION_NAME,
        clone_from=SUBMISSION_URL,
        use_auth_token=HF_TOKEN,
        repo_type="dataset",
    )
    repo.git_pull()
    return pd.read_csv(dir)
|
503 |
+
|
504 |
|
505 |
def convert_scores_to_percentage(df):
|
506 |
# Operate on every column in the DataFrame (except the 'name' column)
|
|
|
629 |
)
|
630 |
return filter_component#.value
|
631 |
|
632 |
+
|
633 |
+
def on_filter_model_size_method_change_2(vbench_team_sample, vbench_team_eval=False):
    """Rebuild the VBench 2.0 table after a filter checkbox changes.

    Args:
        vbench_team_sample: When truthy, keep only rows whose "Sampled by"
            column equals 'VBench Team'.
        vbench_team_eval: When truthy, keep only rows whose 'Evaluated by'
            column equals 'VBench Team'. Defaults to False.

    Returns:
        A new, non-interactive ``gr.components.Dataframe`` holding the
        filtered rows, with ``COLUMN_NAMES_2`` as headers and
        ``VBENCH2_TITLE_TYPE`` as datatype.
    """
    # Use the VBench 2.0 loader. get_all_df's signature is
    # (selected_columns, dir=CSV_DIR), so get_all_df(VBENCH2_DIR) bound the
    # path to selected_columns and left dir at its CSV_DIR default.
    updated_data = get_all_df2(VBENCH2_DIR)

    if vbench_team_sample:
        updated_data = updated_data[updated_data["Sampled by"] == 'VBench Team']
    if vbench_team_eval:
        updated_data = updated_data[updated_data['Evaluated by'] == 'VBench Team']

    # NOTE(review): unlike get_baseline_df_2, the rows are neither restricted
    # to COLUMN_NAMES_2 nor passed through convert_scores_to_percentage --
    # confirm whether the refreshed table should match the initial one.
    filter_component = gr.components.Dataframe(
        value=updated_data,
        headers=COLUMN_NAMES_2,
        type="pandas",
        datatype=VBENCH2_TITLE_TYPE,
        interactive=False,
        visible=True,
    )
    return filter_component
|
659 |
+
|
660 |
block = gr.Blocks()
|
661 |
|
662 |
|
|
|
666 |
)
|
667 |
with gr.Tabs(elem_classes="tab-buttons") as tabs:
|
668 |
# Table 0
|
669 |
+
with gr.TabItem("π VBench 1.0", elem_id="vbench-tab-table", id=1):
|
670 |
with gr.Row():
|
671 |
with gr.Accordion("Citation", open=False):
|
672 |
citation_button = gr.Textbox(
|
|
|
722 |
checkbox_group.change(fn=on_filter_model_size_method_change, inputs=[ checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
723 |
vbench_team_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
724 |
vbench_validate_filter.change(fn=on_filter_model_size_method_change, inputs=[checkbox_group, vbench_team_filter, vbench_validate_filter], outputs=data_component)
|
725 |
+
# VBench 2.0
|
726 |
+
with gr.TabItem("β VBench 2.0", elem_id="vbench-tab-table", id=2):
|
727 |
+
with gr.Row():
|
728 |
+
with gr.Accordion("Citation", open=False):
|
729 |
+
citation_button2 = gr.Textbox(
|
730 |
+
value=CITATION_BUTTON_TEXT,
|
731 |
+
label=CITATION_BUTTON_LABEL,
|
732 |
+
elem_id="citation-button",
|
733 |
+
lines=14,
|
734 |
+
)
|
735 |
+
|
736 |
+
gr.Markdown(
|
737 |
+
TABLE_INTRODUCTION
|
738 |
+
)
|
739 |
+
with gr.Row():
|
740 |
+
with gr.Column():
|
741 |
+
vbench_team_filter_2 = gr.Checkbox(
|
742 |
+
label="Sampled by VBench Team (Uncheck to view all submissions)",
|
743 |
+
value=False,
|
744 |
+
interactive=True
|
745 |
+
)
|
746 |
+
vbench_validate_filter_2 = gr.Checkbox(
|
747 |
+
label="Evaluated by VBench Team (Uncheck to view all submissions)",
|
748 |
+
value=True,
|
749 |
+
interactive=True
|
750 |
+
)
|
751 |
+
|
752 |
+
|
753 |
+
data_component_2 = gr.components.Dataframe(
|
754 |
+
value=get_baseline_df_2,
|
755 |
+
headers=COLUMN_NAMES_2,
|
756 |
+
type="pandas",
|
757 |
+
datatype=VBENCH2_TITLE_TYPE,
|
758 |
+
interactive=False,
|
759 |
+
visible=True,
|
760 |
+
height=700,
|
761 |
+
)
|
762 |
+
# Refresh the VBench 2.0 table from the VBench 2.0 checkboxes. The listeners
# must be attached to the *_2 components, and both inputs must be the *_2
# checkboxes, in the (vbench_team_sample, vbench_team_eval) order the handler expects.
vbench_team_filter_2.change(fn=on_filter_model_size_method_change_2, inputs=[vbench_team_filter_2, vbench_validate_filter_2], outputs=data_component_2)
vbench_validate_filter_2.change(fn=on_filter_model_size_method_change_2, inputs=[vbench_team_filter_2, vbench_validate_filter_2], outputs=data_component_2)
|
764 |
+
|
765 |
+
with gr.TabItem("Video Quality", elem_id="vbench-tab-table", id=3):
|
766 |
with gr.Accordion("INSTRUCTION", open=False):
|
767 |
citation_button = gr.Textbox(
|
768 |
value=QUALITY_CLAIM_TEXT,
|
|
|
793 |
checkbox_group_quality.change(fn=on_filter_model_size_method_change_quality, inputs=[checkbox_group_quality], outputs=data_component_quality)
|
794 |
|
795 |
# Table i2v
|
796 |
+
with gr.TabItem("VBench-I2V", elem_id="vbench-tab-table", id=4):
|
797 |
with gr.Accordion("NOTE", open=False):
|
798 |
i2v_note_button = gr.Textbox(
|
799 |
value=I2V_CLAIM_TEXT,
|
|
|
835 |
vbench_team_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
836 |
vbench_validate_filter_i2v.change(fn=on_filter_model_size_method_change_i2v, inputs=[checkbox_group_i2v, vbench_team_filter_i2v,vbench_validate_filter_i2v], outputs=data_component_i2v)
|
837 |
|
838 |
+
with gr.TabItem("π VBench-Long", elem_id="vbench-tab-table", id=5):
|
839 |
with gr.Row():
|
840 |
with gr.Accordion("INSTRUCTION", open=False):
|
841 |
citation_button = gr.Textbox(
|
|
|
893 |
vbench_validate_filter_long.change(fn=on_filter_model_size_method_change_long, inputs=[checkbox_group_long, vbench_team_filter_long,vbench_validate_filter_long], outputs=data_component)
|
894 |
|
895 |
# table info
|
896 |
+
with gr.TabItem("π About", elem_id="mvbench-tab-table", id=6):
|
897 |
gr.Markdown(LEADERBORAD_INFO, elem_classes="markdown-text")
|
898 |
|
899 |
# table submission
|
900 |
+
with gr.TabItem("π [T2V]Submit here! ", elem_id="mvbench-tab-table", id=7):
|
901 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
902 |
|
903 |
with gr.Row():
|
|
|
969 |
outputs=[submit_button, submit_succ_button, fail_textbox]
|
970 |
)
|
971 |
|
972 |
+
with gr.TabItem("π [I2V]Submit here! ", elem_id="mvbench-i2v-tab-table", id=8):
|
973 |
gr.Markdown(LEADERBORAD_INTRODUCTION, elem_classes="markdown-text")
|
974 |
|
975 |
with gr.Row():
|
|
|
1053 |
data_run.click(on_filter_model_size_method_change, inputs=[checkbox_group], outputs=data_component)
|
1054 |
|
1055 |
|
1056 |
+
block.launch()
|