Spaces:

allenai
/

ZebraLogic

Running

App Files Community

yuchenlin committed on Jul 12, 2024

Commit

eaea101

1 Parent(s): 4dd52cf

sample a puzzle

Browse files

Files changed (1) hide show

app.py +10 -6

app.py CHANGED Viewed

@@ -90,8 +90,8 @@ def _tab_leaderboard():
         mode_selection_radio.change(fn=df_filters, inputs=[mode_selection_radio, _gstr("")], outputs=[leaderboard_table])
-def sample_explore_item(model_name, size_H, size_W, greedy_or_sample):
-    print(model_name, size_H, size_W, greedy_or_sample)
     explore_item = get_random_item(model_name, size_H, size_W)
     if explore_item is None:
         return "No item found", "No item found", "No item found", "No item found"
@@ -99,7 +99,8 @@ def sample_explore_item(model_name, size_H, size_W, greedy_or_sample):
     example_id = explore_item['id']
     puzzle_md = f"### Puzzle [{example_id}]:\n\n" + explore_item['puzzle'].replace("## Clues", "### Clues").replace("\n", "<br>")
     model_reasoning_md = f"### {model_name}'s Reasoning:\n\n {explore_item['reasoning']}"
-    model_prediction_md = f"### {model_name}'s Prediction:\n\n {explore_item['solution']}"  + "\n\n" + explore_item['solution_table_md']
     puzzle_solved = explore_item['correct_cells'] == explore_item['total_cells']
     cell_acc = explore_item["correct_cells"] / explore_item["total_cells"] * 100
     model_eval_md = f"### Evaluation:\n\n  **Total Cells**: {explore_item['total_cells']} | **Correct Cells**: {explore_item['correct_cells']} | **Puzzle solved**: {puzzle_solved} | **Cell Acc**: {cell_acc:.2f}%"
@@ -109,13 +110,16 @@ def sample_explore_item(model_name, size_H, size_W, greedy_or_sample):
 def _tab_explore():
     global raw_data
     model_names = [item["Model"] for item in raw_data]
     with gr.Row():
         model_selection = gr.Dropdown(choices = ["random"] + model_names, label="Model: ", elem_id="select-models", value="random", interactive=True)
         size_H_selection = gr.Dropdown(choices = ["random"] + [f"{i}" for i in range(2,7)], label="Num of Houses", elem_id="select-H", value="random", interactive=True)
         size_W_selection = gr.Dropdown(choices = ["random"] + [f"{i}" for i in range(2,7)], label="Num of Features", elem_id="select-W", value="random", interactive=True)
         with gr.Column(scale=1):
-            greedy_or_sample = gr.Radio(["greedy", "sampling"], show_label=False, elem_id="greedy-or-sample", value="greedy", interactive=True)
-            explore_button = gr.Button("Sample", elem_id="explore-button")
     puzzle_md = gr.Markdown("\n\nTo be loaded", elem_id="puzzle-md", elem_classes="box_md")
     model_reasoning_md = gr.Markdown("\n\nTo be loaded", elem_id="model-reasoning-md", elem_classes="box_md")
@@ -123,7 +127,7 @@ def _tab_explore():
     model_eval_md = gr.Markdown("\n\nTo be loaded", elem_id="model-eval-md", elem_classes="box_md")
     explore_button.click(fn=sample_explore_item,
-                         inputs=[model_selection, size_H_selection, size_W_selection, greedy_or_sample],
                          outputs=[puzzle_md, model_reasoning_md, model_prediction_md, model_eval_md])

         mode_selection_radio.change(fn=df_filters, inputs=[mode_selection_radio, _gstr("")], outputs=[leaderboard_table])
+def sample_explore_item(model_name, size_H, size_W):
+    print(model_name, size_H, size_W)
     explore_item = get_random_item(model_name, size_H, size_W)
     if explore_item is None:
         return "No item found", "No item found", "No item found", "No item found"
     example_id = explore_item['id']
     puzzle_md = f"### Puzzle [{example_id}]:\n\n" + explore_item['puzzle'].replace("## Clues", "### Clues").replace("\n", "<br>")
     model_reasoning_md = f"### {model_name}'s Reasoning:\n\n {explore_item['reasoning']}"
+    model_prediction_md = f"### {model_name}'s Prediction:\n\n {str(explore_item['solution']).replace('___', 'null')}" + \
+                                        "\n\n" + explore_item['solution_table_md']
     puzzle_solved = explore_item['correct_cells'] == explore_item['total_cells']
     cell_acc = explore_item["correct_cells"] / explore_item["total_cells"] * 100
     model_eval_md = f"### Evaluation:\n\n  **Total Cells**: {explore_item['total_cells']} | **Correct Cells**: {explore_item['correct_cells']} | **Puzzle solved**: {puzzle_solved} | **Cell Acc**: {cell_acc:.2f}%"
 def _tab_explore():
     global raw_data
     model_names = [item["Model"] for item in raw_data]
+    # deduplicate and preserve the order
+    model_names = list(dict.fromkeys(model_names))
     with gr.Row():
         model_selection = gr.Dropdown(choices = ["random"] + model_names, label="Model: ", elem_id="select-models", value="random", interactive=True)
         size_H_selection = gr.Dropdown(choices = ["random"] + [f"{i}" for i in range(2,7)], label="Num of Houses", elem_id="select-H", value="random", interactive=True)
         size_W_selection = gr.Dropdown(choices = ["random"] + [f"{i}" for i in range(2,7)], label="Num of Features", elem_id="select-W", value="random", interactive=True)
         with gr.Column(scale=1):
+            # greedy_or_sample = gr.Radio(["greedy", "sampling"], show_label=False, elem_id="greedy-or-sample", value="greedy", interactive=True)
+            gr.Markdown("### 🚀 Click below to sample a puzzle. ⬇️ ")
+            explore_button = gr.Button("🦓 Sample a Zebra Puzzle!", elem_id="explore-button")
     puzzle_md = gr.Markdown("\n\nTo be loaded", elem_id="puzzle-md", elem_classes="box_md")
     model_reasoning_md = gr.Markdown("\n\nTo be loaded", elem_id="model-reasoning-md", elem_classes="box_md")
     model_eval_md = gr.Markdown("\n\nTo be loaded", elem_id="model-eval-md", elem_classes="box_md")
     explore_button.click(fn=sample_explore_item,
+                         inputs=[model_selection, size_H_selection, size_W_selection],
                          outputs=[puzzle_md, model_reasoning_md, model_prediction_md, model_eval_md])