Spaces:

OpenEvals
/

open_benchmark_index

Running

App Files Community

Linker1907 committed on Oct 16

Commit

445a7b6

1 Parent(s): a22d77d

init

Browse files

Files changed (1) hide show

app.py +28 -29

app.py CHANGED Viewed

@@ -20,7 +20,6 @@ import os
 import re
 from collections import Counter
 from dataclasses import asdict, dataclass
-from typing import Dict, List, Optional, Tuple
 import gradio as gr
@@ -39,14 +38,14 @@ class TaskDoc:
     file_path: str
     module: str
     abstract: str
-    languages: List[str]
-    tags: List[str]
-    paper: Optional[str]
-    dataset: Optional[str]
-    name: Optional[str] = None
-def read_file_text(path: str) -> Optional[str]:
     try:
         with open(path, "r", encoding="utf-8") as f:
             return f.read()
@@ -54,7 +53,7 @@ def read_file_text(path: str) -> Optional[str]:
         return None
-def parse_module_docstring(text: str) -> Optional[str]:
     try:
         mod = ast.parse(text)
         return ast.get_docstring(mod)
@@ -64,11 +63,11 @@ def parse_module_docstring(text: str) -> Optional[str]:
         return m.group(2).strip() if m else None
-def parse_sections(doc: str) -> Dict[str, str]:
     # Very simple section parser keyed by lines ending with ':' on their own
     # Expected keys: name, dataset, abstract, languages, tags, paper
-    out: Dict[str, str] = {"name": "", "dataset": "", "abstract": "", "languages": "", "tags": "", "paper": ""}
-    current_key: Optional[str] = None
     for raw_line in doc.splitlines():
         line = raw_line.rstrip()
         if line.endswith(":") and line.strip().lower() in {"name:", "dataset:", "abstract:", "languages:", "tags:", "paper:"}:
@@ -80,12 +79,12 @@ def parse_sections(doc: str) -> Dict[str, str]:
     return out
-def split_list_field(value: str) -> List[str]:
     if not value:
         return []
     # Support comma and newline separated values
     parts = re.split(r"[\n,]", value)
-    cleaned: List[str] = []
     for p in parts:
         token = p.strip()
         if not token:
@@ -94,8 +93,8 @@ def split_list_field(value: str) -> List[str]:
     return cleaned
-def discover_task_files() -> List[str]:
-    files: List[str] = []
     for base in TASK_DIRS:
         if not os.path.isdir(base):
             continue
@@ -111,7 +110,7 @@ def discover_task_files() -> List[str]:
                 files.append(os.path.join(dirpath, "main.py"))
     # Deduplicate while preserving order
     seen: set = set()
-    unique_files: List[str] = []
     for p in files:
         if p in seen:
             continue
@@ -120,8 +119,8 @@ def discover_task_files() -> List[str]:
     return sorted(unique_files)
-def index_tasks() -> Tuple[List[TaskDoc], List[str], List[str]]:
-    docs: List[TaskDoc] = []
     language_counts: Counter = Counter()
     tag_set: set = set()
     for path in discover_task_files():
@@ -151,7 +150,7 @@ def index_tasks() -> Tuple[List[TaskDoc], List[str], List[str]]:
     return docs, languages_sorted, tags_sorted
-def save_index(path: str, tasks: List[TaskDoc], langs: List[str], tags: List[str]) -> None:
     data = {
         "tasks": [asdict(t) for t in tasks],
         "languages": list(langs),
@@ -162,7 +161,7 @@ def save_index(path: str, tasks: List[TaskDoc], langs: List[str], tags: List[str
         json.dump(data, f, ensure_ascii=False, indent=2)
-def load_index(path: str) -> Optional[Tuple[List[TaskDoc], List[str], List[str]]]:
     if not os.path.exists(path):
         return None
     with open(path, "r", encoding="utf-8") as f:
@@ -173,7 +172,7 @@ def load_index(path: str) -> Optional[Tuple[List[TaskDoc], List[str], List[str]]
     return tasks, langs, tags
-def build_and_cache_index() -> Tuple[List[TaskDoc], List[str], List[str]]:
     tasks, langs, tags = index_tasks()
     save_index(CACHE_PATH, tasks, langs, tags)
     return tasks, langs, tags
@@ -190,11 +189,11 @@ print(f"Loaded {len(ALL_TASKS)} tasks from cache")
 TOP_LANGS = ALL_LANGS[:8]  # show more by default
-def filter_tasks(languages: List[str], tags: List[str], search: str) -> List[TaskDoc]:
     selected_langs = [lang.lower() for lang in (languages or [])]
     selected_tags = [t.lower() for t in (tags or [])]
     search_lc = (search or "").strip().lower()
-    out: List[TaskDoc] = []
     for td in ALL_TASKS:
         if selected_langs and not any(lang in td.languages for lang in selected_langs):
             continue
@@ -209,9 +208,9 @@ def filter_tasks(languages: List[str], tags: List[str], search: str) -> List[Tas
     return out
-def render_cards(tasks: List[TaskDoc]) -> str:
     # Responsive grid of pretty cards; show all details without clicks
-    items: List[str] = []
     for t in tasks:
         parts = t.module.replace("\\", "/").split("/")
         base_no_ext = parts[-1].rsplit(".", 1)[0]
@@ -313,21 +312,21 @@ def render_cards(tasks: List[TaskDoc]) -> str:
     return style + "<div class=\"cards-grid\">" + "\n".join(items) + "</div>"
-def on_filter(languages: List[str], tags: List[str], search: str):
     tasks = filter_tasks(languages, tags, search)
     return render_cards(tasks)
-def on_toggle_language_choices(show_all: bool, selected_langs: List[str], tags: List[str], search: str):
     choices = ALL_LANGS if show_all else TOP_LANGS
     kept = [lang for lang in (selected_langs or []) if lang in choices]
     tasks = filter_tasks(kept, tags, search)
     return gr.update(choices=choices, value=kept), render_cards(tasks)
-def on_toggle_tags_visibility(show: bool, selected_tags: List[str], languages: List[str], search: str):
     # Only toggle visibility; preserve current tag selections and keep them active in filtering
-    tags_value: List[str] = selected_tags or []
     tasks = filter_tasks(languages, tags_value, search)
     # keep selections when showing; when hiding we keep value but component hidden (so filter still uses them)
     return gr.update(visible=show, value=tags_value), render_cards(tasks)

 import re
 from collections import Counter
 from dataclasses import asdict, dataclass
 import gradio as gr
     file_path: str
     module: str
     abstract: str
+    languages: list[str]
+    tags: list[str]
+    paper: str | None
+    dataset: str | None
+    name: str | None = None
+def read_file_text(path: str) -> str | None:
     try:
         with open(path, "r", encoding="utf-8") as f:
             return f.read()
         return None
+def parse_module_docstring(text: str) -> str | None:
     try:
         mod = ast.parse(text)
         return ast.get_docstring(mod)
         return m.group(2).strip() if m else None
+def parse_sections(doc: str) -> dict[str, str]:
     # Very simple section parser keyed by lines ending with ':' on their own
     # Expected keys: name, dataset, abstract, languages, tags, paper
+    out: dict[str, str] = {"name": "", "dataset": "", "abstract": "", "languages": "", "tags": "", "paper": ""}
+    current_key: str | None = None
     for raw_line in doc.splitlines():
         line = raw_line.rstrip()
         if line.endswith(":") and line.strip().lower() in {"name:", "dataset:", "abstract:", "languages:", "tags:", "paper:"}:
     return out
+def split_list_field(value: str) -> list[str]:
     if not value:
         return []
     # Support comma and newline separated values
     parts = re.split(r"[\n,]", value)
+    cleaned: list[str] = []
     for p in parts:
         token = p.strip()
         if not token:
     return cleaned
+def discover_task_files() -> list[str]:
+    files: list[str] = []
     for base in TASK_DIRS:
         if not os.path.isdir(base):
             continue
                 files.append(os.path.join(dirpath, "main.py"))
     # Deduplicate while preserving order
     seen: set = set()
+    unique_files: list[str] = []
     for p in files:
         if p in seen:
             continue
     return sorted(unique_files)
+def index_tasks() -> tuple[list[TaskDoc], list[str], list[str]]:
+    docs: list[TaskDoc] = []
     language_counts: Counter = Counter()
     tag_set: set = set()
     for path in discover_task_files():
     return docs, languages_sorted, tags_sorted
+def save_index(path: str, tasks: list[TaskDoc], langs: list[str], tags: list[str]) -> None:
     data = {
         "tasks": [asdict(t) for t in tasks],
         "languages": list(langs),
         json.dump(data, f, ensure_ascii=False, indent=2)
+def load_index(path: str) -> tuple[list[TaskDoc], list[str], list[str]] | None:
     if not os.path.exists(path):
         return None
     with open(path, "r", encoding="utf-8") as f:
     return tasks, langs, tags
+def build_and_cache_index() -> tuple[list[TaskDoc], list[str], list[str]]:
     tasks, langs, tags = index_tasks()
     save_index(CACHE_PATH, tasks, langs, tags)
     return tasks, langs, tags
 TOP_LANGS = ALL_LANGS[:8]  # show more by default
+def filter_tasks(languages: list[str], tags: list[str], search: str) -> list[TaskDoc]:
     selected_langs = [lang.lower() for lang in (languages or [])]
     selected_tags = [t.lower() for t in (tags or [])]
     search_lc = (search or "").strip().lower()
+    out: list[TaskDoc] = []
     for td in ALL_TASKS:
         if selected_langs and not any(lang in td.languages for lang in selected_langs):
             continue
     return out
+def render_cards(tasks: list[TaskDoc]) -> str:
     # Responsive grid of pretty cards; show all details without clicks
+    items: list[str] = []
     for t in tasks:
         parts = t.module.replace("\\", "/").split("/")
         base_no_ext = parts[-1].rsplit(".", 1)[0]
     return style + "<div class=\"cards-grid\">" + "\n".join(items) + "</div>"
+def on_filter(languages: list[str], tags: list[str], search: str):
     tasks = filter_tasks(languages, tags, search)
     return render_cards(tasks)
+def on_toggle_language_choices(show_all: bool, selected_langs: list[str], tags: list[str], search: str):
     choices = ALL_LANGS if show_all else TOP_LANGS
     kept = [lang for lang in (selected_langs or []) if lang in choices]
     tasks = filter_tasks(kept, tags, search)
     return gr.update(choices=choices, value=kept), render_cards(tasks)
+def on_toggle_tags_visibility(show: bool, selected_tags: list[str], languages: list[str], search: str):
     # Only toggle visibility; preserve current tag selections and keep them active in filtering
+    tags_value: list[str] = selected_tags or []
     tasks = filter_tasks(languages, tags_value, search)
     # keep selections when showing; when hiding we keep value but component hidden (so filter still uses them)
     return gr.update(visible=show, value=tags_value), render_cards(tasks)