"""Gradio front-end for the YourBench auto-leaderboard.

Builds a ``gr.Blocks`` page containing a results table, an example-index
selector and three tabs of HTML sample views, wires the two callbacks
imported from ``utils`` to it, and launches the app.
"""
from env import TASK
from utils import run_pipeline, update_examples
import gradio as gr

with gr.Blocks(
    title="YourBench Leaderboard",
    css="button { margin: 0 10px; padding: 5px 15px; }",
) as app:
    # DISPLAY TABLE AND ANALYSIS
    title = gr.Markdown(f"YourBench auto-Leaderboard for {TASK}")
    leaderboard = gr.DataFrame(label="Results", interactive=False)

    # Index shared by the three sample views below.
    samples_ix = gr.Number(
        label="Example Index",
        value=0,
        step=1,
        info="Navigate through different examples",
    )
    with gr.Tab("Hardest samples"):
        hard_samples = gr.HTML()
    with gr.Tab("Easiest samples"):
        easy_samples = gr.HTML()
    with gr.Tab("All samples"):
        all_samples = gr.HTML()

    # Event listeners have to be registered while the Blocks context is
    # still open, so both hooks live inside the `with` body.
    # Changing the index refreshes the three HTML panes; the output order
    # (easy, hard, all) must match what `update_examples` returns
    # -- NOTE(review): confirm against utils.update_examples.
    samples_ix.change(update_examples, samples_ix, [easy_samples, hard_samples, all_samples])

    # On page load, populate the table and the three panes in one call.
    app.load(run_pipeline, [samples_ix], [leaderboard, easy_samples, hard_samples, all_samples])

app.launch()