Spaces:

FSMBench
/

Leaderboard

Sleeping

App Files Community

taesiri committed on Apr 21, 2024

Commit

5b905b8

1 Parent(s): 05e4334

update

Browse files

Files changed (1) hide show

app.py +8 -7

app.py CHANGED Viewed

@@ -38,12 +38,13 @@ def load_data(files, model_type):
 # Load and label all data
 data = load_data(noncot_results, "Text Only")
 vision_data = load_data(vision_results, "Vision")
 cot_text_data = load_data(cot_text_results, "CoT Text Only")
 # cot_vision_data = load_data(cot_vision_results, "CoT Vision")
 # Combine all data into a single DataFrame
-all_data = pd.concat([data, vision_data, cot_text_data], ignore_index=True)
 all_model_names = all_data["Model Name"].unique()
 all_text_only_model_names = list(
@@ -414,7 +415,7 @@ def generate_heatmap_for_intersection_model(model_name):
     sns.despine(ax=ax, top=True, right=True, left=True, bottom=True)
-    plt.close(fig)  # Prevent it from showing immediately
     return fig
@@ -443,7 +444,7 @@ with gr.Blocks() as demo:
         heatmap_image_qwen = gr.Image(label="", show_label=False)
         leader_board.select(fn=load_heatmap_qwen, outputs=[heatmap_image_qwen])
-    with gr.Tab("Vision Benchmark"):
         gr.Markdown("# Vision Benchmark Leaderboard")
         leader_board_vision = gr.Dataframe(
             vision_accuracy_df, headers=headers_with_icons
@@ -454,7 +455,7 @@ with gr.Blocks() as demo:
             fn=load_vision_heatmap, outputs=[heatmap_image_vision]
         )
-    with gr.Tab("Text-only Benchmark (CoT)"):
         gr.Markdown("# Text-only Leaderboard (CoT)")
         cot_leader_board_text = gr.Dataframe(
             cot_text_accuracy_df, headers=headers_with_icons
@@ -499,7 +500,7 @@ with gr.Blocks() as demo:
         queue=True,
     )
-    with gr.Tab("Constraint Text-only Results (CoT)"):
         gr.Markdown("## Constraint Text-only Leaderboard by first substrin (CoT)")
         included_models_cot = gr.CheckboxGroup(
             label="Models to include",
@@ -514,14 +515,14 @@ with gr.Blocks() as demo:
         constrained_leader_board_text_cot = gr.Dataframe()
         constrained_leader_board_plot_cot = gr.Plot()
-    with gr.Tab("Majority Vote (Subset 1)"):
         gr.Markdown("## Majority Vote (Subset 1)")
         intersection_leader_board = gr.Dataframe(
             intersection_df_acc, headers=headers_with_icons
         )
         heatmap_image = gr.Plot(label="Model Heatmap")
-    with gr.Tab("Text-only Benchmark (deprecated)"):
         gr.Markdown("# Text-only Leaderboard")
         leader_board = gr.Dataframe(accuracy_df, headers=headers_with_icons)
         gr.Markdown("## Heatmap")

 # Load and label all data
 data = load_data(noncot_results, "Text Only")
+data_qwen = load_data(noncot_results_qwen, "Text Only")
 vision_data = load_data(vision_results, "Vision")
 cot_text_data = load_data(cot_text_results, "CoT Text Only")
 # cot_vision_data = load_data(cot_vision_results, "CoT Vision")
 # Combine all data into a single DataFrame
+all_data = pd.concat([data_qwen, vision_data, cot_text_data], ignore_index=True)
 all_model_names = all_data["Model Name"].unique()
 all_text_only_model_names = list(
     sns.despine(ax=ax, top=True, right=True, left=True, bottom=True)
+    plt.close(fig)
     return fig
         heatmap_image_qwen = gr.Image(label="", show_label=False)
         leader_board.select(fn=load_heatmap_qwen, outputs=[heatmap_image_qwen])
+    with gr.Tab("Vision Benchmark", visible=False):
         gr.Markdown("# Vision Benchmark Leaderboard")
         leader_board_vision = gr.Dataframe(
             vision_accuracy_df, headers=headers_with_icons
             fn=load_vision_heatmap, outputs=[heatmap_image_vision]
         )
+    with gr.Tab("Text-only Benchmark (CoT)", visible=False):
         gr.Markdown("# Text-only Leaderboard (CoT)")
         cot_leader_board_text = gr.Dataframe(
             cot_text_accuracy_df, headers=headers_with_icons
         queue=True,
     )
+    with gr.Tab("Constraint Text-only Results (CoT)", visible=False):
         gr.Markdown("## Constraint Text-only Leaderboard by first substrin (CoT)")
         included_models_cot = gr.CheckboxGroup(
             label="Models to include",
         constrained_leader_board_text_cot = gr.Dataframe()
         constrained_leader_board_plot_cot = gr.Plot()
+    with gr.Tab("Majority Vote (Subset 1)", visible=False):
         gr.Markdown("## Majority Vote (Subset 1)")
         intersection_leader_board = gr.Dataframe(
             intersection_df_acc, headers=headers_with_icons
         )
         heatmap_image = gr.Plot(label="Model Heatmap")
+    with gr.Tab("Text-only Benchmark (deprecated)", visible=False):
         gr.Markdown("# Text-only Leaderboard")
         leader_board = gr.Dataframe(accuracy_df, headers=headers_with_icons)
         gr.Markdown("## Heatmap")