Spaces:

DontPlanToEnd
/

UGI-Leaderboard

Running

App Files Community

444

DontPlanToEnd committed on Mar 13, 2024

Commit

fb27588

verified ·

1 Parent(s): f19c73b

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -49

app.py CHANGED Viewed

@@ -60,32 +60,24 @@ with demo:
     gr.Markdown("## UGI Leaderboard", elem_classes="text-lg text-center")
     gr.Markdown("""
     UGI: Uncensored General Intelligence. The average of 5 different subjects that LLMs are commonly steered away from. The leaderboard is made from roughly 60 questions overall, measuring both "willingness to answer" and "accuracy" in fact-based controversial questions.
     Willingness: A more narrow score, solely measuring the LLM's willingness to answer controversial questions.
     Unruly: Knowledge of activities that are generally frowned upon.
     Internet: Knowledge of various internet information, from professional to deviant.
     CrimeStats: Knowledge of crime statistics which are uncomfortable to talk about.
     Stories/Jokes: Ability to write offensive stories and jokes.
     PolContro: Knowledge of politically/socially controversial information.
     """)
     with gr.Column():
         with gr.Row():
             search_bar = gr.Textbox(placeholder=" 🔍 Search for a model...", show_label=False)
-        with gr.Row(variant="compact"):
-            gr.Markdown("Model sizes (in billions of parameters)", elem_classes="text-sm")
-            param_range_1 = gr.Checkbox(label="~1.5", value=False)
-            param_range_2 = gr.Checkbox(label="~3", value=False)
-            param_range_3 = gr.Checkbox(label="~7", value=False)
-            param_range_4 = gr.Checkbox(label="~13", value=False)
-            param_range_5 = gr.Checkbox(label="~20", value=False)
-            param_range_6 = gr.Checkbox(label="~34", value=False)
-            param_range_7 = gr.Checkbox(label="~50", value=False)
-            param_range_8 = gr.Checkbox(label="~70+", value=False)
     # Load the initial leaderboard data
     leaderboard_df = load_leaderboard_data("ugi-leaderboard-data.csv")
@@ -104,48 +96,22 @@ with demo:
     # Define the search and filter functionality
     inputs = [
         search_bar,
-        param_range_1,
-        param_range_2,
-        param_range_3,
-        param_range_4,
-        param_range_5,
-        param_range_6,
-        param_range_7,
-        param_range_8
     ]
     outputs = leaderboard_table
     search_bar.change(
-        fn=lambda query, r1, r2, r3, r4, r5, r6, r7, r8: update_table(leaderboard_df, query, {
-            '~1.5': r1,
-            '~3': r2,
-            '~7': r3,
-            '~13': r4,
-            '~20': r5,
-            '~34': r6,
-            '~50': r7,
-            '~70+': r8
-        }),
         inputs=inputs,
         outputs=outputs
     )
-    for param_range in inputs[1:]:
-        param_range.change(
-            fn=lambda query, r1, r2, r3, r4, r5, r6, r7, r8: update_table(leaderboard_df, query, {
-                '~1.5': r1,
-                '~3': r2,
-                '~7': r3,
-                '~13': r4,
-                '~20': r5,
-                '~34': r6,
-                '~50': r7,
-                '~70+': r8
-            }),
-            inputs=inputs,
-            outputs=outputs
-        )
 # Launch the Gradio app
 demo.launch()

     gr.Markdown("## UGI Leaderboard", elem_classes="text-lg text-center")
     gr.Markdown("""
     UGI: Uncensored General Intelligence. The average of 5 different subjects that LLMs are commonly steered away from. The leaderboard is made from roughly 60 questions overall, measuring both "willingness to answer" and "accuracy" in fact-based controversial questions.
     Willingness: A more narrow score, solely measuring the LLM's willingness to answer controversial questions.
     Unruly: Knowledge of activities that are generally frowned upon.
     Internet: Knowledge of various internet information, from professional to deviant.
     CrimeStats: Knowledge of crime statistics which are uncomfortable to talk about.
     Stories/Jokes: Ability to write offensive stories and jokes.
     PolContro: Knowledge of politically/socially controversial information.
     """)
     with gr.Column():
         with gr.Row():
             search_bar = gr.Textbox(placeholder=" 🔍 Search for a model...", show_label=False)
+        with gr.Row():
+            filter_columns_size = gr.CheckboxGroup(
+                label="Model sizes (in billions of parameters)",
+                choices=['~1.5', '~3', '~7', '~13', '~20', '~34', '~50', '~70+'],
+                value=['~1.5', '~3', '~7', '~13', '~20', '~34', '~50', '~70+'],
+                interactive=True,
+                elem_id="filter-columns-size",
+            )
     # Load the initial leaderboard data
     leaderboard_df = load_leaderboard_data("ugi-leaderboard-data.csv")
     # Define the search and filter functionality
     inputs = [
         search_bar,
+        filter_columns_size
     ]
     outputs = leaderboard_table
     search_bar.change(
+        fn=lambda query, param_ranges: update_table(leaderboard_df, query, dict(zip(['~1.5', '~3', '~7', '~13', '~20', '~34', '~50', '~70+'], param_ranges))),
         inputs=inputs,
         outputs=outputs
     )
+    filter_columns_size.change(
+        fn=lambda query, param_ranges: update_table(leaderboard_df, query, dict(zip(['~1.5', '~3', '~7', '~13', '~20', '~34', '~50', '~70+'], param_ranges))),
+        inputs=inputs,
+        outputs=outputs
+    )
 # Launch the Gradio app
 demo.launch()