Terry Zhuo
committed on
Commit
·
e2e46b9
1
Parent(s):
777def4
add gt pass rate
Browse files
app.py
CHANGED
@@ -511,12 +511,12 @@ with main_block as demo:
|
|
511 |
)
|
512 |
|
513 |
with gr.TabItem("🛠️ Code Execution (Beta)", id=5):
|
514 |
-
gr.Markdown("## Upload your sanitized JSONL file to evaluate")
|
515 |
|
516 |
with gr.Row():
|
517 |
jsonl_file = gr.File(label="Upload JSONL file", file_types=[".jsonl"])
|
518 |
split = gr.Dropdown(choices=["complete", "instruct"], label="Split", value="complete")
|
519 |
-
subset = gr.Dropdown(choices=["hard
|
520 |
|
521 |
with gr.Row():
|
522 |
parallel = gr.Number(label="Parallel (optional)", precision=0)
|
|
|
511 |
)
|
512 |
|
513 |
with gr.TabItem("🛠️ Code Execution (Beta)", id=5):
|
514 |
+
gr.Markdown("## Upload your sanitized JSONL file to evaluate\n\n### Hard Set Ground Truth Pass Rate: 100%\n### Full Set Ground Truth Pass Rate: 99.6%")
|
515 |
|
516 |
with gr.Row():
|
517 |
jsonl_file = gr.File(label="Upload JSONL file", file_types=[".jsonl"])
|
518 |
split = gr.Dropdown(choices=["complete", "instruct"], label="Split", value="complete")
|
519 |
+
subset = gr.Dropdown(choices=["hard", "full"], label="Subset", value="hard")
|
520 |
|
521 |
with gr.Row():
|
522 |
parallel = gr.Number(label="Parallel (optional)", precision=0)
|