Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -151,9 +151,11 @@ def enhanced_format_preview_for_display(preview_data):
|
|
| 151 |
# 3. Gradio Interface
|
| 152 |
# ---------------------------------------------------------------------------
|
| 153 |
with gr.Blocks() as demo:
|
| 154 |
-
gr.Markdown("#
|
| 155 |
gr.Markdown("""
|
| 156 |
-
This demo evaluates
|
|
|
|
|
|
|
| 157 |
""")
|
| 158 |
|
| 159 |
# Dataset Selection Section
|
|
@@ -164,7 +166,7 @@ with gr.Blocks() as demo:
|
|
| 164 |
choices=["(Select Dataset)", "MMLU-Pro"],
|
| 165 |
value="(Select Dataset)",
|
| 166 |
label="Dataset",
|
| 167 |
-
info="Select a dataset to
|
| 168 |
)
|
| 169 |
preview_toggle = gr.Button("Show Preview", interactive=False, variant="secondary")
|
| 170 |
|
|
|
|
| 151 |
# 3. Gradio Interface
|
| 152 |
# ---------------------------------------------------------------------------
|
| 153 |
with gr.Blocks() as demo:
|
| 154 |
+
gr.Markdown("# Head-to-Head Model Evaluation Comparator")
|
| 155 |
gr.Markdown("""
|
| 156 |
+
This demo evaluates two models (or one model with two different configs) on a benchmark dataset.
|
| 157 |
+
Available Datasets: [MMLU-Pro](https://huggingface.co/datasets/TIGER-Lab/MMLU-Pro)
|
| 158 |
+
Available Models: [Mistral-7B-v0.1](https://huggingface.co/mistralai/Mistral-7B-v0.1)
|
| 159 |
""")
|
| 160 |
|
| 161 |
# Dataset Selection Section
|
|
|
|
| 166 |
choices=["(Select Dataset)", "MMLU-Pro"],
|
| 167 |
value="(Select Dataset)",
|
| 168 |
label="Dataset",
|
| 169 |
+
info="Select a dataset to perform the Head-to-Head Evaluation on. Available Datasets: [MMLU-Pro](https://huggingface.co/datasets/TIGER-Lab/MMLU-Pro)"
|
| 170 |
)
|
| 171 |
preview_toggle = gr.Button("Show Preview", interactive=False, variant="secondary")
|
| 172 |
|