Commit
·
d1ca5fe
1
Parent(s):
39bc9e0
fix L-MT on default page
Browse files
- app.py +18 -5
- submissions/baseline/results.json +1 -1
- uploads.py +10 -0
app.py
CHANGED
|
@@ -156,8 +156,17 @@ with demo:
|
|
| 156 |
with gr.Row():
|
| 157 |
tasks_checkbox = gr.CheckboxGroup(
|
| 158 |
label="Select Tasks",
|
| 159 |
-
choices=[
|
| 160 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 161 |
interactive=True,
|
| 162 |
)
|
| 163 |
|
|
@@ -231,7 +240,7 @@ with demo:
|
|
| 231 |
leaderboard_table = gr.components.Dataframe(
|
| 232 |
value=load_data(
|
| 233 |
# "baseline",
|
| 234 |
-
["L-NER", "RR", "CJPE", "BAIL", "LSI", "PCR", "SUMM"],
|
| 235 |
task_metrics=task_metrics,
|
| 236 |
),
|
| 237 |
interactive=True,
|
|
@@ -392,10 +401,13 @@ with demo:
|
|
| 392 |
outputs=leaderboard_table,
|
| 393 |
)
|
| 394 |
|
| 395 |
-
with gr.Accordion("Submit the
|
| 396 |
with gr.Row():
|
| 397 |
with gr.Column():
|
| 398 |
-
method_name_textbox = gr.Textbox(
|
|
|
|
|
|
|
|
|
|
| 399 |
url_textbox = gr.Textbox(label="Github Link")
|
| 400 |
organisation = gr.Textbox(label="Organisation")
|
| 401 |
mail = gr.Textbox(label="Contact email")
|
|
@@ -407,6 +419,7 @@ with demo:
|
|
| 407 |
add_new_eval,
|
| 408 |
[
|
| 409 |
method_name_textbox,
|
|
|
|
| 410 |
url_textbox,
|
| 411 |
file_output,
|
| 412 |
organisation,
|
|
|
|
| 156 |
with gr.Row():
|
| 157 |
tasks_checkbox = gr.CheckboxGroup(
|
| 158 |
label="Select Tasks",
|
| 159 |
+
choices=[
|
| 160 |
+
"L-NER",
|
| 161 |
+
"RR",
|
| 162 |
+
"CJPE",
|
| 163 |
+
"BAIL",
|
| 164 |
+
"LSI",
|
| 165 |
+
"PCR",
|
| 166 |
+
"SUMM",
|
| 167 |
+
"L-MT",
|
| 168 |
+
],
|
| 169 |
+
value=["L-NER", "RR", "CJPE", "BAIL", "LSI", "PCR", "SUMM", "L-MT"],
|
| 170 |
interactive=True,
|
| 171 |
)
|
| 172 |
|
|
|
|
| 240 |
leaderboard_table = gr.components.Dataframe(
|
| 241 |
value=load_data(
|
| 242 |
# "baseline",
|
| 243 |
+
["L-NER", "RR", "CJPE", "BAIL", "LSI", "PCR", "SUMM", "L-MT"],
|
| 244 |
task_metrics=task_metrics,
|
| 245 |
),
|
| 246 |
interactive=True,
|
|
|
|
| 401 |
outputs=leaderboard_table,
|
| 402 |
)
|
| 403 |
|
| 404 |
+
with gr.Accordion("Submit the Results of your Method"):
|
| 405 |
with gr.Row():
|
| 406 |
with gr.Column():
|
| 407 |
+
method_name_textbox = gr.Textbox(
|
| 408 |
+
label="Method",
|
| 409 |
+
)
|
| 410 |
+
submitted_by_textbox = gr.Textbox(label="Submitted By (Team Name)")
|
| 411 |
url_textbox = gr.Textbox(label="Github Link")
|
| 412 |
organisation = gr.Textbox(label="Organisation")
|
| 413 |
mail = gr.Textbox(label="Contact email")
|
|
|
|
| 419 |
add_new_eval,
|
| 420 |
[
|
| 421 |
method_name_textbox,
|
| 422 |
+
submitted_by_textbox,
|
| 423 |
url_textbox,
|
| 424 |
file_output,
|
| 425 |
organisation,
|
submissions/baseline/results.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
[{"Method": "SOTA", "Submitted By": "multiple", "Github Link": "exploration-lab.github.io/IL-TUR/", "L-NER": {"strict mF1": "48.58"}, "RR": {"mF1": "69.01"}, "CJPE": {"mF1": "81.31", "ROUGE-L": "56.00", "BLEU": "32.00"}, "BAIL": {"mF1": "81"}, "LSI": {"mF1": "28.08"}, "PCR": {"muF1@K": "39.15"}, "SUMM": {"ROUGE-L": "33.00", "BERTSCORE": "86.00"}, "L-MT": {"BLEU": "28.00", "GLEU": "32.00", "chrF++": "57.00"}}, {"Method": "BERT", "Submitted By": "multiple", "Github Link": "", "L-NER": {"strict mF1": "39.59"}, "RR": {"mF1": "58"}, "CJPE": {"mF1": "71.14", "ROUGE-L": "-", "BLEU": "-"}, "BAIL": {"mF1": "-"}, "LSI": {"mF1": "-"}, "PCR": {"muF1@K": "18.44"}, "SUMM": {"ROUGE-L": "9.24", "BERTSCORE": "-"}, "L-MT": {"BLEU": "-", "GLEU": "-", "chrF++": "-"}}, {"Method": "LegalBERT", "Submitted By": "multiple", "Github Link": "", "L-NER": {"strict mF1": "45.58"}, "RR": {"mF1": "54"}, "CJPE": {"mF1": "78.21", "ROUGE-L": "-", "BLEU": "-"}, "BAIL": {"mF1": "-"}, "LSI": {"mF1": "-"}, "PCR": {"muF1@K": "21.74"}, "SUMM": {"ROUGE-L": "8.67", "BERTSCORE": "-"}, "L-MT": {"BLEU": "-", "GLEU": "-", "chrF++": "-"}}, {"Method": "InLegalBERT", "Submitted By": "multiple", "Github Link": "", "L-NER": {"strict mF1": "48.58"}, "RR": {"mF1": "58"}, "CJPE": {"mF1": "81.31", "ROUGE-L": "-", "BLEU": "-"}, "BAIL": {"mF1": "-"}, "LSI": {"mF1": "-"}, "PCR": {"muF1@K": "26.23"}, "SUMM": {"ROUGE-L": "7.57", "BERTSCORE": "-"}, "L-MT": {"BLEU": "-", "GLEU": "-", "chrF++": "-"}}, {"Method": "GPT-3.5 (0-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "30.59"}, "RR": {"mF1": "30.95"}, "CJPE": {"mF1": "54.17", "ROUGE-L": "30.00", "BLEU": "8.00"}, "BAIL": {"mF1": "51.04"}, "LSI": {"mF1": "21.55"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "21.00", "BERTSCORE": "85.00"}, "L-MT": {"BLEU": "23.00", "GLEU": "28.00", "chrF++": "42.00"}}, {"Method": "GPT-3.5 (1-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "23.68"}, "RR": {"mF1": "30.05"}, "CJPE": {"mF1": 
"51.46", "ROUGE-L": "29.00", "BLEU": "15.00"}, "BAIL": {"mF1": "46.35"}, "LSI": {"mF1": "22.61"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "20.00", "BERTSCORE": "84.00"}, "L-MT": {"BLEU": "25.00", "GLEU": "28.00", "chrF++": "43.00"}}, {"Method": "GPT-3.5 (2-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "32.84"}, "RR": {"mF1": "30.31"}, "CJPE": {"mF1": "56.74", "ROUGE-L": "30.00", "BLEU": "11.00"}, "BAIL": {"mF1": "61"}, "LSI": {"mF1": "21.4"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "22.00", "BERTSCORE": "84.00"}, "L-MT": {"BLEU": "26.00", "GLEU": "29.00", "chrF++": "43.00"}}, {"Method": "GPT-4 (0-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "13.65"}, "RR": {"mF1": "37.37"}, "CJPE": {"mF1": "68.29", "ROUGE-L": "40.00", "BLEU": "14.00"}, "BAIL": {"mF1": "51.46"}, "LSI": {"mF1": "23.99"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "23.00", "BERTSCORE": "85.00"}, "L-MT": {"BLEU": "33.00", "GLEU": "36.00", "chrF++": "50.00"}}, {"Method": "GPT-4 (1-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "10.51"}, "RR": {"mF1": "37.43"}, "CJPE": {"mF1": "47.26", "ROUGE-L": "39.00", "BLEU": "16.00"}, "BAIL": {"mF1": "56.9"}, "LSI": {"mF1": "22.26"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "16.00", "BERTSCORE": "81.00"}, "L-MT": {"BLEU": "35.00", "GLEU": "38.00", "chrF++": "52.00"}}, {"Method": "GPT-4 (2-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "24.03"}, "RR": {"mF1": "38.18"}, "CJPE": {"mF1": "60.44", "ROUGE-L": "43.00", "BLEU": "18.00"}, "BAIL": {"mF1": "66.67"}, "LSI": {"mF1": "20.53"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "17.00", "BERTSCORE": "81.00"}, "L-MT": {"BLEU": "36.00", "GLEU": "39.00", "chrF++": "53.00"}}
|
|
|
|
| 1 |
+
[{"Method": "SOTA", "Submitted By": "multiple", "Github Link": "exploration-lab.github.io/IL-TUR/", "L-NER": {"strict mF1": "48.58"}, "RR": {"mF1": "69.01"}, "CJPE": {"mF1": "81.31", "ROUGE-L": "56.00", "BLEU": "32.00"}, "BAIL": {"mF1": "81"}, "LSI": {"mF1": "28.08"}, "PCR": {"muF1@K": "39.15"}, "SUMM": {"ROUGE-L": "33.00", "BERTSCORE": "86.00"}, "L-MT": {"BLEU": "28.00", "GLEU": "32.00", "chrF++": "57.00"}}, {"Method": "BERT", "Submitted By": "multiple", "Github Link": "", "L-NER": {"strict mF1": "39.59"}, "RR": {"mF1": "58"}, "CJPE": {"mF1": "71.14", "ROUGE-L": "-", "BLEU": "-"}, "BAIL": {"mF1": "-"}, "LSI": {"mF1": "-"}, "PCR": {"muF1@K": "18.44"}, "SUMM": {"ROUGE-L": "9.24", "BERTSCORE": "-"}, "L-MT": {"BLEU": "-", "GLEU": "-", "chrF++": "-"}}, {"Method": "LegalBERT", "Submitted By": "multiple", "Github Link": "", "L-NER": {"strict mF1": "45.58"}, "RR": {"mF1": "54"}, "CJPE": {"mF1": "78.21", "ROUGE-L": "-", "BLEU": "-"}, "BAIL": {"mF1": "-"}, "LSI": {"mF1": "-"}, "PCR": {"muF1@K": "21.74"}, "SUMM": {"ROUGE-L": "8.67", "BERTSCORE": "-"}, "L-MT": {"BLEU": "-", "GLEU": "-", "chrF++": "-"}}, {"Method": "InLegalBERT", "Submitted By": "multiple", "Github Link": "", "L-NER": {"strict mF1": "48.58"}, "RR": {"mF1": "58"}, "CJPE": {"mF1": "81.31", "ROUGE-L": "-", "BLEU": "-"}, "BAIL": {"mF1": "-"}, "LSI": {"mF1": "-"}, "PCR": {"muF1@K": "26.23"}, "SUMM": {"ROUGE-L": "7.57", "BERTSCORE": "-"}, "L-MT": {"BLEU": "-", "GLEU": "-", "chrF++": "-"}}, {"Method": "GPT-3.5 (0-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "30.59"}, "RR": {"mF1": "30.95"}, "CJPE": {"mF1": "54.17", "ROUGE-L": "30.00", "BLEU": "8.00"}, "BAIL": {"mF1": "51.04"}, "LSI": {"mF1": "21.55"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "21.00", "BERTSCORE": "85.00"}, "L-MT": {"BLEU": "23.00", "GLEU": "28.00", "chrF++": "42.00"}}, {"Method": "GPT-3.5 (1-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "23.68"}, "RR": {"mF1": "30.05"}, "CJPE": {"mF1": 
"51.46", "ROUGE-L": "29.00", "BLEU": "15.00"}, "BAIL": {"mF1": "46.35"}, "LSI": {"mF1": "22.61"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "20.00", "BERTSCORE": "84.00"}, "L-MT": {"BLEU": "25.00", "GLEU": "28.00", "chrF++": "43.00"}}, {"Method": "GPT-3.5 (2-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "32.84"}, "RR": {"mF1": "30.31"}, "CJPE": {"mF1": "56.74", "ROUGE-L": "30.00", "BLEU": "11.00"}, "BAIL": {"mF1": "61"}, "LSI": {"mF1": "21.4"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "22.00", "BERTSCORE": "84.00"}, "L-MT": {"BLEU": "26.00", "GLEU": "29.00", "chrF++": "43.00"}}, {"Method": "GPT-4 (0-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "13.65"}, "RR": {"mF1": "37.37"}, "CJPE": {"mF1": "68.29", "ROUGE-L": "40.00", "BLEU": "14.00"}, "BAIL": {"mF1": "51.46"}, "LSI": {"mF1": "23.99"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "23.00", "BERTSCORE": "85.00"}, "L-MT": {"BLEU": "33.00", "GLEU": "36.00", "chrF++": "50.00"}}, {"Method": "GPT-4 (1-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "10.51"}, "RR": {"mF1": "37.43"}, "CJPE": {"mF1": "47.26", "ROUGE-L": "39.00", "BLEU": "16.00"}, "BAIL": {"mF1": "56.9"}, "LSI": {"mF1": "22.26"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "16.00", "BERTSCORE": "81.00"}, "L-MT": {"BLEU": "35.00", "GLEU": "38.00", "chrF++": "52.00"}}, {"Method": "GPT-4 (2-shot)", "Submitted By": "IL-TUR", "Github Link": "", "L-NER": {"strict mF1": "24.03"}, "RR": {"mF1": "38.18"}, "CJPE": {"mF1": "60.44", "ROUGE-L": "43.00", "BLEU": "18.00"}, "BAIL": {"mF1": "66.67"}, "LSI": {"mF1": "20.53"}, "PCR": {"muF1@K": "-"}, "SUMM": {"ROUGE-L": "17.00", "BERTSCORE": "81.00"}, "L-MT": {"BLEU": "36.00", "GLEU": "39.00", "chrF++": "53.00"}}]
|
uploads.py
CHANGED
|
@@ -4,6 +4,7 @@ import os
|
|
| 4 |
import datetime
|
| 5 |
import json
|
| 6 |
import pandas as pd
|
|
|
|
| 7 |
|
| 8 |
LEADERBOARD_PATH = "Exploration-Lab/IL-TUR-Leaderboard"
|
| 9 |
# RESULTS_PATH = "Exploration-Lab/IL-TUR-Leaderboard-results"
|
|
@@ -42,11 +43,20 @@ def input_verification(method_name, url, path_to_file, organisation, mail):
|
|
| 42 |
if path_to_file is None:
|
| 43 |
return format_warning("Please attach a file.")
|
| 44 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 45 |
return parsed_mail
|
| 46 |
|
| 47 |
|
| 48 |
def add_new_eval(
|
| 49 |
method_name: str,
|
|
|
|
| 50 |
url: str,
|
| 51 |
path_to_file: str,
|
| 52 |
organisation: str,
|
|
|
|
| 4 |
import datetime
|
| 5 |
import json
|
| 6 |
import pandas as pd
|
| 7 |
+
import gradio as gr
|
| 8 |
|
| 9 |
LEADERBOARD_PATH = "Exploration-Lab/IL-TUR-Leaderboard"
|
| 10 |
# RESULTS_PATH = "Exploration-Lab/IL-TUR-Leaderboard-results"
|
|
|
|
| 43 |
if path_to_file is None:
|
| 44 |
return format_warning("Please attach a file.")
|
| 45 |
|
| 46 |
+
# check the required fields
|
| 47 |
+
required_fields = ["Method", "Submitted By", "url", "organisation", "mail"]
|
| 48 |
+
|
| 49 |
+
# Check if the required_fields are not blank
|
| 50 |
+
for field in required_fields:
|
| 51 |
+
if field not in locals():
|
| 52 |
+
raise gr.Error(f"{field} cannot be blank")
|
| 53 |
+
|
| 54 |
return parsed_mail
|
| 55 |
|
| 56 |
|
| 57 |
def add_new_eval(
|
| 58 |
method_name: str,
|
| 59 |
+
submitted_by: str,
|
| 60 |
url: str,
|
| 61 |
path_to_file: str,
|
| 62 |
organisation: str,
|