Spaces:

SWE-Arena
/

SWE-Review

Sleeping

App Files Files Community

zhiminy commited on Oct 18

Commit

39cbf48

1 Parent(s): 325abdd

remove msr

Browse files

Files changed (2) hide show

app.py +62 -29
msr.py +0 -1224

app.py CHANGED Viewed

@@ -48,6 +48,7 @@ DEBUG_REVIEW_METADATA_CACHE = defaultdict(list)
 AGENTS_REPO = "SWE-Arena/swe_agents"  # HuggingFace dataset for agent metadata
 REVIEW_METADATA_REPO = "SWE-Arena/review_metadata"  # HuggingFace dataset for review metadata
 LEADERBOARD_COLUMNS = [
     ("Agent Name", "string"),
@@ -770,17 +771,14 @@ def calculate_monthly_metrics_by_agent():
             }
         }
     """
-    # Get current year for loading metadata
-    current_year = datetime.now().year
     # Load ALL agents from HuggingFace agents repo
     agents = load_agents_from_hf()
     # Create mapping from agent_identifier to agent_name
     identifier_to_name = {agent.get('github_identifier'): agent.get('agent_name') for agent in agents if agent.get('github_identifier')}
-    # Load all review metadata for current year from review_metadata dataset
-    all_metadata = load_review_metadata_for_year(current_year)
     if not all_metadata:
         return {'agents': [], 'months': [], 'data': {}}
@@ -967,27 +965,42 @@ def save_review_metadata_to_hf(metadata_list, agent_identifier):
         return False
-def load_review_metadata_for_year(year):
     """
-    Load all review metadata for a specific year from HuggingFace.
-    Scans all agent folders and loads daily files matching the year.
-    In debug mode, loads from in-memory cache if available.
     Structure: [agent_identifier]/YYYY.MM.DD.jsonl
     Returns:
         List of dictionaries with 'agent_identifier' added to each review metadata.
     """
     # In debug mode, check in-memory cache first
     if DEBUG_MODE and DEBUG_REVIEW_METADATA_CACHE:
         all_metadata = []
         for agent_identifier, metadata_list in DEBUG_REVIEW_METADATA_CACHE.items():
             for review_meta in metadata_list:
                 review_with_agent = review_meta.copy()
                 review_with_agent['agent_identifier'] = agent_identifier
                 all_metadata.append(review_with_agent)
         if all_metadata:
-            print(f"🐛 DEBUG MODE: Loading review metadata from in-memory cache ({len(all_metadata)} reviews)")
             return all_metadata
     try:
@@ -997,22 +1010,33 @@ def load_review_metadata_for_year(year):
         # List all files in the repository
         files = api.list_repo_files(repo_id=REVIEW_METADATA_REPO, repo_type="dataset")
-        # Filter for files matching the year pattern: [agent_identifier]/YYYY.MM.DD.jsonl
-        # Extract year from filename
-        year_str = str(year)
-        year_files = []
         for f in files:
             if f.endswith('.jsonl'):
                 parts = f.split('/')
                 if len(parts) == 2:  # [agent_identifier]/YYYY.MM.DD.jsonl
                     filename = parts[1]
-                    if filename.startswith(year_str + '.'):
-                        year_files.append(f)
-        print(f"📥 Loading review metadata for {year} ({len(year_files)} daily files across all agents)...")
         all_metadata = []
-        for filename in year_files:
             try:
                 # Extract agent_identifier from path (first part)
                 # Format: agent_identifier/YYYY.MM.DD.jsonl
@@ -1031,20 +1055,32 @@ def load_review_metadata_for_year(year):
                 )
                 day_metadata = load_jsonl(file_path)
-                # Add agent_identifier to each review metadata for processing
                 for review_meta in day_metadata:
                     review_meta['agent_identifier'] = agent_identifier
-                all_metadata.extend(day_metadata)
-                print(f"   ✓ Loaded {len(day_metadata)} reviews from {filename}")
             except Exception as e:
                 print(f"   Warning: Could not load {filename}: {str(e)}")
-        print(f"✓ Loaded {len(all_metadata)} total reviews for {year}")
         return all_metadata
     except Exception as e:
-        print(f"✗ Error loading review metadata for {year}: {str(e)}")
         return []
@@ -1532,7 +1568,6 @@ def update_all_agents_incremental():
     Returns dictionary of all agent data with current stats.
     """
     token = get_github_token()
-    current_year = datetime.now().year
     # Load agent metadata from HuggingFace
     agents = load_agents_from_hf()
@@ -1587,9 +1622,9 @@ def update_all_agents_incremental():
             else:
                 print(f"   No new reviews to save")
-            # Load ALL metadata for current year to calculate stats (aggregates entire last 6 months)
             print(f"📊 Calculating statistics from ALL stored metadata (last 6 months)...")
-            all_year_metadata = load_review_metadata_for_year(current_year)
             # Filter for this specific agent
             agent_metadata = [review for review in all_year_metadata if review.get("agent_identifier") == identifier]
@@ -1624,8 +1659,6 @@ def construct_leaderboard_from_metadata():
     Returns dictionary of agent stats.
     """
     print("📊 Constructing leaderboard from review metadata...")
-    current_year = datetime.now().year
     # Load agents
     agents = load_agents_from_hf()
     if not agents:
@@ -1633,7 +1666,7 @@ def construct_leaderboard_from_metadata():
         return {}
     # Load all review metadata for current year
-    all_metadata = load_review_metadata_for_year(current_year)
     cache_dict = {}

 AGENTS_REPO = "SWE-Arena/swe_agents"  # HuggingFace dataset for agent metadata
 REVIEW_METADATA_REPO = "SWE-Arena/review_metadata"  # HuggingFace dataset for review metadata
+LEADERBOARD_TIME_FRAME_DAYS = 180  # Time frame for leaderboard (past 6 months)
 LEADERBOARD_COLUMNS = [
     ("Agent Name", "string"),
             }
         }
     """
     # Load ALL agents from HuggingFace agents repo
     agents = load_agents_from_hf()
     # Create mapping from agent_identifier to agent_name
     identifier_to_name = {agent.get('github_identifier'): agent.get('agent_name') for agent in agents if agent.get('github_identifier')}
+    # Load all review metadata from review_metadata dataset
+    all_metadata = load_review_metadata()
     if not all_metadata:
         return {'agents': [], 'months': [], 'data': {}}
         return False
+def load_review_metadata():
     """
+    Load review metadata from the last LEADERBOARD_TIME_FRAME_DAYS.
+    In debug mode, loads from in-memory cache if available and filters by time frame.
     Structure: [agent_identifier]/YYYY.MM.DD.jsonl
     Returns:
         List of dictionaries with 'agent_identifier' added to each review metadata.
+        Only includes reviews from the last LEADERBOARD_TIME_FRAME_DAYS.
     """
+    # Calculate cutoff date based on LEADERBOARD_TIME_FRAME_DAYS
+    current_time = datetime.now(timezone.utc)
+    cutoff_date = current_time - timedelta(days=LEADERBOARD_TIME_FRAME_DAYS)
     # In debug mode, check in-memory cache first
     if DEBUG_MODE and DEBUG_REVIEW_METADATA_CACHE:
         all_metadata = []
         for agent_identifier, metadata_list in DEBUG_REVIEW_METADATA_CACHE.items():
             for review_meta in metadata_list:
+                # Filter by time frame
+                reviewed_at = review_meta.get('reviewed_at')
+                if reviewed_at:
+                    try:
+                        dt = datetime.fromisoformat(reviewed_at.replace('Z', '+00:00'))
+                        if dt < cutoff_date:
+                            continue  # Skip reviews older than time frame
+                    except Exception:
+                        pass  # Keep reviews with unparseable dates
                 review_with_agent = review_meta.copy()
                 review_with_agent['agent_identifier'] = agent_identifier
                 all_metadata.append(review_with_agent)
         if all_metadata:
+            print(f"🐛 DEBUG MODE: Loading review metadata from in-memory cache (last {LEADERBOARD_TIME_FRAME_DAYS} days, {len(all_metadata)} reviews)")
             return all_metadata
     try:
         # List all files in the repository
         files = api.list_repo_files(repo_id=REVIEW_METADATA_REPO, repo_type="dataset")
+        # Filter for files matching the pattern: [agent_identifier]/YYYY.MM.DD.jsonl
+        # AND within the time frame (parse date from filename)
+        time_frame_files = []
         for f in files:
             if f.endswith('.jsonl'):
                 parts = f.split('/')
                 if len(parts) == 2:  # [agent_identifier]/YYYY.MM.DD.jsonl
                     filename = parts[1]
+                    # Parse date from filename: YYYY.MM.DD.jsonl
+                    try:
+                        date_part = filename.replace('.jsonl', '')  # Get YYYY.MM.DD
+                        date_components = date_part.split('.')
+                        if len(date_components) == 3:
+                            file_year, file_month, file_day = map(int, date_components)
+                            file_date = datetime(file_year, file_month, file_day, tzinfo=timezone.utc)
+                            # Only include files within the time frame
+                            if file_date >= cutoff_date:
+                                time_frame_files.append(f)
+                    except Exception:
+                        # If we can't parse the date, skip this file
+                        continue
+        print(f"📥 Loading review metadata from last {LEADERBOARD_TIME_FRAME_DAYS} days ({len(time_frame_files)} daily files across all agents)...")
         all_metadata = []
+        for filename in time_frame_files:
             try:
                 # Extract agent_identifier from path (first part)
                 # Format: agent_identifier/YYYY.MM.DD.jsonl
                 )
                 day_metadata = load_jsonl(file_path)
+                # Add agent_identifier and filter by time frame (double-check)
+                filtered_count = 0
                 for review_meta in day_metadata:
+                    # Validate review date is within time frame
+                    reviewed_at = review_meta.get('reviewed_at')
+                    if reviewed_at:
+                        try:
+                            dt = datetime.fromisoformat(reviewed_at.replace('Z', '+00:00'))
+                            if dt < cutoff_date:
+                                continue  # Skip reviews older than time frame
+                        except Exception:
+                            pass  # Keep reviews with unparseable dates
                     review_meta['agent_identifier'] = agent_identifier
+                    all_metadata.append(review_meta)
+                    filtered_count += 1
+                print(f"   ✓ Loaded {filtered_count} reviews from {filename}")
             except Exception as e:
                 print(f"   Warning: Could not load {filename}: {str(e)}")
+        print(f"✓ Loaded {len(all_metadata)} total reviews from last {LEADERBOARD_TIME_FRAME_DAYS} days")
         return all_metadata
     except Exception as e:
+        print(f"✗ Error loading review metadata from last {LEADERBOARD_TIME_FRAME_DAYS} days: {str(e)}")
         return []
     Returns dictionary of all agent data with current stats.
     """
     token = get_github_token()
     # Load agent metadata from HuggingFace
     agents = load_agents_from_hf()
             else:
                 print(f"   No new reviews to save")
+            # Load ALL metadata to calculate stats (aggregates entire last 6 months)
             print(f"📊 Calculating statistics from ALL stored metadata (last 6 months)...")
+            all_year_metadata = load_review_metadata()
             # Filter for this specific agent
             agent_metadata = [review for review in all_year_metadata if review.get("agent_identifier") == identifier]
     Returns dictionary of agent stats.
     """
     print("📊 Constructing leaderboard from review metadata...")
     # Load agents
     agents = load_agents_from_hf()
     if not agents:
         return {}
     # Load all review metadata for current year
+    all_metadata = load_review_metadata()
     cache_dict = {}

msr.py DELETED Viewed

@@ -1,1224 +0,0 @@
-"""
-Standalone miner to fetch PR review metadata and update the leaderboard immediately.
-This script reuses the same logic and on-disk/HuggingFace formats as app.py, but
-has no UI or scheduler. You can run it once, or run it in a loop for hours.
-Datasets used:
-- Agents: SWE-Arena/swe_agents
-- Review metadata: SWE-Arena/review_metadata
-Environment:
-- Requires HF_TOKEN (for HuggingFace uploads)
-- Optional GITHUB_TOKEN (highly recommended to avoid low rate limits)
-- Reads .env if present
-CLI flags:
-- --debug / --no-debug: Same semantics as app.py (debug limits to 10 PRs/pattern
-  and DOES NOT save to HF, mirroring app.py behavior).
-- --loop: Keep running in a loop.
-- --interval-seconds N: Sleep between loops (default 3600 seconds).
-Note: In production mode (default), data will be saved to HuggingFace datasets.
-"""
-import argparse
-import json
-import os
-import random
-import sys
-import time
-from collections import defaultdict
-from datetime import datetime, timezone, timedelta
-import pandas as pd
-import requests
-from dotenv import load_dotenv
-from huggingface_hub import HfApi, hf_hub_download
-# =============================================================================
-# Environment & CLI
-# =============================================================================
-load_dotenv()
-parser = argparse.ArgumentParser(description="Immediate PR review miner for SWE Arena")
-parser.add_argument("--debug", "--DEBUG", action="store_true", help="Enable debug mode (limits PR retrieval to 10 per query; does NOT save to HF)")
-parser.add_argument("--no-debug", "--production", action="store_true", help="Explicitly disable debug mode (force production mode)")
-parser.add_argument("--loop", action="store_true", help="Run in a loop until interrupted")
-parser.add_argument("--interval-seconds", type=int, default=3600, help="Sleep interval between loops in seconds (default: 3600)")
-args = parser.parse_args()
-# DEBUG MODE priority: 1) flags, 2) env var, 3) default False
-if args.no_debug:
-    DEBUG_MODE = False
-elif args.debug:
-    DEBUG_MODE = True
-else:
-    DEBUG_MODE = os.getenv("DEBUG_MODE", "False").lower() in ("true", "1", "yes")
-# =============================================================================
-# Constants (match app.py)
-# =============================================================================
-DEBUG_REVIEW_METADATA_CACHE = defaultdict(list)
-AGENTS_REPO = "SWE-Arena/swe_agents"
-REVIEW_METADATA_REPO = "SWE-Arena/review_metadata"
-# =============================================================================
-# Utilities & I/O (match app.py behavior exactly)
-# =============================================================================
-def load_jsonl(filename):
-    """Load JSONL file and return list of dictionaries."""
-    if not os.path.exists(filename):
-        return []
-    data = []
-    with open(filename, 'r', encoding='utf-8') as f:
-        for line in f:
-            line = line.strip()
-            if line:
-                try:
-                    entry = json.loads(line)
-                    data.append(entry)
-                except json.JSONDecodeError as e:
-                    print(f"Warning: Skipping invalid JSON line: {e}")
-    return data
-def save_jsonl(filename, data):
-    """Save list of dictionaries to JSONL file."""
-    with open(filename, 'w', encoding='utf-8') as f:
-        for item in data:
-            f.write(json.dumps(item) + '\n')
-def cache_to_dict(cache_list):
-    return {entry['github_identifier']: entry for entry in cache_list}
-def dict_to_cache(cache_dict):
-    return list(cache_dict.values())
-def get_github_token():
-    token = os.getenv('GITHUB_TOKEN')
-    if not token:
-        print("Warning: GITHUB_TOKEN not found. API rate limits: 60/hour (authenticated: 5000/hour)")
-    return token
-def get_hf_token():
-    token = os.getenv('HF_TOKEN')
-    if not token:
-        print("Warning: HF_TOKEN not found in environment variables")
-    return token
-def upload_with_retry(api, path_or_fileobj, path_in_repo, repo_id, repo_type, token, max_retries=5):
-    """
-    Upload file to HuggingFace with exponential backoff retry logic.
-    Args:
-        api: HfApi instance
-        path_or_fileobj: Local file path to upload
-        path_in_repo: Target path in the repository
-        repo_id: Repository ID
-        repo_type: Type of repository (e.g., "dataset")
-        token: HuggingFace token
-        max_retries: Maximum number of retry attempts
-    Returns:
-        True if upload succeeded, raises exception if all retries failed
-    """
-    delay = 2.0  # Initial delay in seconds
-    for attempt in range(max_retries):
-        try:
-            api.upload_file(
-                path_or_fileobj=path_or_fileobj,
-                path_in_repo=path_in_repo,
-                repo_id=repo_id,
-                repo_type=repo_type,
-                token=token
-            )
-            if attempt > 0:
-                print(f"   ✓ Upload succeeded on attempt {attempt + 1}/{max_retries}")
-            return True
-        except Exception as e:
-            if attempt < max_retries - 1:
-                wait_time = delay + random.uniform(0, 1.0)
-                print(f"   ⚠️ Upload failed (attempt {attempt + 1}/{max_retries}): {str(e)}")
-                print(f"   ⏳ Retrying in {wait_time:.1f} seconds...")
-                time.sleep(wait_time)
-                delay = min(delay * 2, 60.0)  # Exponential backoff, max 60s
-            else:
-                print(f"   ✗ Upload failed after {max_retries} attempts: {str(e)}")
-                raise
-# =============================================================================
-# GitHub API with backoff (same as app.py)
-# =============================================================================
-def request_with_backoff(method, url, *, headers=None, params=None, json_body=None, data=None, max_retries=10, timeout=30):
-    delay = 1.0
-    for attempt in range(max_retries):
-        try:
-            resp = requests.request(
-                method,
-                url,
-                headers=headers or {},
-                params=params,
-                json=json_body,
-                data=data,
-                timeout=timeout
-            )
-            status = resp.status_code
-            if 200 <= status < 300:
-                return resp
-            if status in (403, 429) or 500 <= status < 600:
-                wait = None
-                retry_after = resp.headers.get('Retry-After') or resp.headers.get('retry-after')
-                if retry_after:
-                    try:
-                        wait = float(retry_after)
-                    except Exception:
-                        wait = None
-                if wait is None and status in (403, 429):
-                    reset_hdr = resp.headers.get('X-RateLimit-Reset') or resp.headers.get('x-ratelimit-reset')
-                    if reset_hdr:
-                        try:
-                            reset_ts = int(float(reset_hdr))
-                            wait = max(reset_ts - time.time() + 2, 1)
-                        except Exception:
-                            wait = None
-                if wait is None:
-                    wait = delay + random.uniform(0, 0.5)
-                wait = max(1.0, min(wait, 120.0))
-                print(f"GitHub API {status}. Backing off {wait:.1f}s (attempt {attempt + 1}/{max_retries})...")
-                time.sleep(wait)
-                delay = min(delay * 2, 60.0)
-                continue
-            return resp
-        except requests.RequestException as e:
-            wait = delay + random.uniform(0, 0.5)
-            wait = max(1.0, min(wait, 60.0))
-            print(f"Request error: {e}. Retrying in {wait:.1f}s (attempt {attempt + 1}/{max_retries})...")
-            time.sleep(wait)
-            delay = min(delay * 2, 60.0)
-    print(f"Exceeded max retries for {url}")
-    return None
-def fetch_reviews_with_time_partition(base_query, start_date, end_date, headers, prs_by_url, debug_limit=None, depth=0):
-    """
-    Fetch PR reviews within a specific time range using time-based partitioning.
-    Recursively splits the time range if hitting the 1000-result limit.
-    Supports splitting by day, hour, minute, and second as needed.
-    Args:
-        debug_limit: If set, stops fetching after this many NEW PRs total across all partitions (for testing)
-        depth: Current recursion depth (for tracking)
-    Returns the number of PRs found in this time partition.
-    """
-    # Calculate time difference
-    time_diff = end_date - start_date
-    total_seconds = time_diff.total_seconds()
-    # Determine granularity and format dates accordingly
-    if total_seconds >= 86400:  # >= 1 day
-        # Use day granularity (YYYY-MM-DD)
-        start_str = start_date.strftime('%Y-%m-%d')
-        end_str = end_date.strftime('%Y-%m-%d')
-    elif total_seconds >= 3600:  # >= 1 hour but < 1 day
-        # Use hour granularity (YYYY-MM-DDTHH:MM:SSZ)
-        start_str = start_date.strftime('%Y-%m-%dT%H:00:00Z')
-        end_str = end_date.strftime('%Y-%m-%dT%H:59:59Z')
-    elif total_seconds >= 60:  # >= 1 minute but < 1 hour
-        # Use minute granularity (YYYY-MM-DDTHH:MM:SSZ)
-        start_str = start_date.strftime('%Y-%m-%dT%H:%M:00Z')
-        end_str = end_date.strftime('%Y-%m-%dT%H:%M:59Z')
-    else:  # < 1 minute
-        # Use second granularity (YYYY-MM-DDTHH:MM:SSZ)
-        start_str = start_date.strftime('%Y-%m-%dT%H:%M:%SZ')
-        end_str = end_date.strftime('%Y-%m-%dT%H:%M:%SZ')
-    query = f'{base_query} created:{start_str}..{end_str}'
-    indent = "  " + "  " * depth
-    print(f"{indent}Searching range {start_str} to {end_str}...")
-    page = 1
-    per_page = 100
-    total_in_partition = 0
-    while True:
-        # Check debug limit GLOBALLY (total unique PRs across all partitions)
-        if debug_limit is not None and len(prs_by_url) >= debug_limit:
-            print(f"{indent}  🐛 DEBUG MODE: Reached global limit of {debug_limit} PRs, stopping...")
-            return total_in_partition
-        url = 'https://api.github.com/search/issues'  # Use issues endpoint for PR search
-        params = {
-            'q': query,
-            'per_page': per_page,
-            'page': page,
-            'sort': 'created',
-            'order': 'asc'
-        }
-        headers_with_accept = headers.copy() if headers else {}
-        try:
-            response = request_with_backoff('GET', url, headers=headers_with_accept, params=params)
-            if response is None:
-                print(f"{indent}  Error: retries exhausted for range {start_str} to {end_str}")
-                return total_in_partition
-            if response.status_code != 200:
-                print(f"{indent}  Error: HTTP {response.status_code} for range {start_str} to {end_str}")
-                return total_in_partition
-            data = response.json()
-            total_count = data.get('total_count', 0)
-            items = data.get('items', [])
-            if not items:
-                break
-            # Add PR reviews to global dict (keyed by PR URL)
-            for pr in items:
-                pr_url = pr.get('html_url')
-                pr_number = pr.get('number')
-                # Use PR URL as unique key (more reliable than number alone)
-                if pr_url and pr_url not in prs_by_url:
-                    prs_by_url[pr_url] = pr
-                    total_in_partition += 1
-            # Check if we hit the 1000-result limit
-            if total_count > 1000 and page == 10:
-                print(f"{indent}  ⚠️ Hit 1000-result limit ({total_count} total). Splitting time range...")
-                # Determine how to split based on time range duration
-                if total_seconds < 2:  # Less than 2 seconds - can't split further
-                    print(f"{indent}  ⚠️ Cannot split further (range < 2 seconds). Some results may be missing.")
-                    break
-                elif total_seconds < 120:  # Less than 2 minutes - split by seconds
-                    # Split into 2-4 parts depending on range
-                    num_splits = min(4, max(2, int(total_seconds / 30)))
-                    split_duration = time_diff / num_splits
-                    split_dates = [start_date + split_duration * i for i in range(num_splits + 1)]
-                    total_from_splits = 0
-                    for i in range(num_splits):
-                        split_start = split_dates[i]
-                        split_end = split_dates[i + 1]
-                        # Avoid overlapping ranges (add 1 second to start)
-                        if i > 0:
-                            split_start = split_start + timedelta(seconds=1)
-                        count = fetch_reviews_with_time_partition(
-                            base_query, split_start, split_end, headers, prs_by_url, debug_limit, depth + 1
-                        )
-                        total_from_splits += count
-                    return total_from_splits
-                elif total_seconds < 7200:  # Less than 2 hours - split by minutes
-                    # Split into 2-4 parts
-                    num_splits = min(4, max(2, int(total_seconds / 1800)))
-                    split_duration = time_diff / num_splits
-                    split_dates = [start_date + split_duration * i for i in range(num_splits + 1)]
-                    total_from_splits = 0
-                    for i in range(num_splits):
-                        split_start = split_dates[i]
-                        split_end = split_dates[i + 1]
-                        # Avoid overlapping ranges (add 1 minute to start)
-                        if i > 0:
-                            split_start = split_start + timedelta(minutes=1)
-                        count = fetch_reviews_with_time_partition(
-                            base_query, split_start, split_end, headers, prs_by_url, debug_limit, depth + 1
-                        )
-                        total_from_splits += count
-                    return total_from_splits
-                elif total_seconds < 172800:  # Less than 2 days - split by hours
-                    # Split into 2-4 parts
-                    num_splits = min(4, max(2, int(total_seconds / 43200)))
-                    split_duration = time_diff / num_splits
-                    split_dates = [start_date + split_duration * i for i in range(num_splits + 1)]
-                    total_from_splits = 0
-                    for i in range(num_splits):
-                        split_start = split_dates[i]
-                        split_end = split_dates[i + 1]
-                        # Avoid overlapping ranges (add 1 hour to start)
-                        if i > 0:
-                            split_start = split_start + timedelta(hours=1)
-                        count = fetch_reviews_with_time_partition(
-                            base_query, split_start, split_end, headers, prs_by_url, debug_limit, depth + 1
-                        )
-                        total_from_splits += count
-                    return total_from_splits
-                else:  # 2+ days - split by days
-                    days_diff = time_diff.days
-                    # Use aggressive splitting for large ranges or deep recursion
-                    # Split into 4 parts if range is > 30 days, otherwise split in half
-                    if days_diff > 30 or depth > 5:
-                        # Split into 4 parts for more aggressive partitioning
-                        quarter_diff = time_diff / 4
-                        split_dates = [
-                            start_date,
-                            start_date + quarter_diff,
-                            start_date + quarter_diff * 2,
-                            start_date + quarter_diff * 3,
-                            end_date
-                        ]
-                        total_from_splits = 0
-                        for i in range(4):
-                            split_start = split_dates[i]
-                            split_end = split_dates[i + 1]
-                            # Avoid overlapping ranges
-                            if i > 0:
-                                split_start = split_start + timedelta(days=1)
-                            count = fetch_reviews_with_time_partition(
-                                base_query, split_start, split_end, headers, prs_by_url, debug_limit, depth + 1
-                            )
-                            total_from_splits += count
-                        return total_from_splits
-                    else:
-                        # Binary split for smaller ranges
-                        mid_date = start_date + time_diff / 2
-                        # Recursively fetch both halves
-                        count1 = fetch_reviews_with_time_partition(
-                            base_query, start_date, mid_date, headers, prs_by_url, debug_limit, depth + 1
-                        )
-                        count2 = fetch_reviews_with_time_partition(
-                            base_query, mid_date + timedelta(days=1), end_date, headers, prs_by_url, debug_limit, depth + 1
-                        )
-                        return count1 + count2
-            # Normal pagination: check if there are more pages
-            if len(items) < per_page or page >= 10:
-                break
-            page += 1
-            time.sleep(0.5)  # Courtesy delay between pages
-        except Exception as e:
-            print(f"{indent}  Error fetching range {start_str} to {end_str}: {str(e)}")
-            return total_in_partition
-    if total_in_partition > 0:
-        print(f"{indent}  ✓ Found {total_in_partition} PRs in range {start_str} to {end_str}")
-    return total_in_partition
-def extract_review_metadata(pr):
-    """
-    Extract minimal PR review metadata for efficient storage.
-    Only keeps essential fields: html_url, reviewed_at, pr_status, pr_merged, pr_closed_at.
-    Note: agent_name is not stored as it's inferred from the folder structure.
-    PR status:
-    - pr_status: 'open', 'merged', or 'closed'
-    - pr_merged: True if PR was merged, False otherwise
-    - pr_closed_at: Date when PR was closed/merged (if applicable)
-    merged PR = PR that was merged after agent review
-    Rejected PR = PR that was closed without merging after agent review
-    """
-    # Extract PR metadata from search results
-    # The GitHub search API returns PR data from /search/issues endpoint
-    pr_url = pr.get('html_url')
-    pr_number = pr.get('number')
-    created_at = pr.get('created_at')
-    closed_at = pr.get('closed_at')
-    state = pr.get('state', 'open')  # open or closed
-    # Check if PR has pull_request field (indicates it's a PR, not an issue)
-    pull_request_data = pr.get('pull_request', {})
-    # For initial extraction, we don't know if merged yet
-    # This will be updated by update_pr_status function
-    pr_merged = pull_request_data.get('merged_at') is not None if pull_request_data else False
-    # Determine initial status
-    if pr_merged:
-        status = 'merged'
-    elif state == 'closed':
-        status = 'closed'
-    else:
-        status = 'open'
-    return {
-        'html_url': pr_url,
-        'reviewed_at': created_at,  # When the PR was created (agent reviewed it)
-        'pr_status': status,
-        'pr_merged': pr_merged,
-        'pr_closed_at': closed_at,
-        'pr_url': pr_url,  # Store PR URL for tracking
-        'review_id': f"pr_{pr_number}"  # Use PR number for deduplication
-    }
-def update_pr_status(metadata_list, headers, token):
-    """
-    Update PR status for reviews to get current merged/closed state.
-    For each PR associated with a review, fetch current status from GitHub API.
-    Updates metadata_list in-place with PR status information.
-    In DEBUG MODE: Skips status updates to avoid API rate limits.
-    Args:
-        metadata_list: List of review metadata dictionaries
-        headers: HTTP headers for GitHub API
-        token: GitHub API token
-    Returns:
-        Updated metadata_list with current PR status
-    """
-    if not metadata_list:
-        return metadata_list
-    # In debug mode, skip status updates to avoid excessive API calls
-    if DEBUG_MODE:
-        print(f"   🐛 DEBUG MODE: Skipping PR status updates for {len(metadata_list)} reviews")
-        return metadata_list
-    # Track unique PRs to avoid duplicate API calls
-    pr_url_to_status = {}
-    updated_count = 0
-    for metadata in metadata_list:
-        pr_url = metadata.get('pr_url')
-        if not pr_url:
-            continue
-        # Skip if already fetched for this PR
-        if pr_url in pr_url_to_status:
-            status_info = pr_url_to_status[pr_url]
-            metadata['pr_status'] = status_info['status']
-            metadata['pr_merged'] = status_info['merged']
-            metadata['pr_closed_at'] = status_info['closed_at']
-            continue
-        try:
-            # Convert HTML URL to API URL
-            # https://github.com/owner/repo/pull/123 -> https://api.github.com/repos/owner/repo/pulls/123
-            parts = pr_url.replace('https://github.com/', '').split('/')
-            if len(parts) >= 4:
-                owner, repo, pull_word, pr_number = parts[0], parts[1], parts[2], parts[3]
-                api_url = f'https://api.github.com/repos/{owner}/{repo}/pulls/{pr_number}'
-                response = request_with_backoff('GET', api_url, headers=headers, max_retries=3)
-                if response and response.status_code == 200:
-                    pr_data = response.json()
-                    state = pr_data.get('state', 'open')
-                    merged = pr_data.get('merged', False)
-                    closed_at = pr_data.get('closed_at')
-                    merged_at = pr_data.get('merged_at')
-                    # Determine final status
-                    if merged:
-                        status = 'merged'
-                    elif state == 'closed':
-                        status = 'closed'
-                    else:
-                        status = 'open'
-                    status_info = {
-                        'status': status,
-                        'merged': merged,
-                        'closed_at': closed_at or merged_at
-                    }
-                    # Cache and update
-                    pr_url_to_status[pr_url] = status_info
-                    metadata['pr_status'] = status
-                    metadata['pr_merged'] = merged
-                    metadata['pr_closed_at'] = closed_at or merged_at
-                    updated_count += 1
-                # Small delay to avoid rate limiting
-                time.sleep(0.1)
-        except Exception as e:
-            print(f"   Warning: Could not check PR status for {pr_url}: {e}")
-            continue
-    if updated_count > 0:
-        print(f"   ✓ Updated status for {updated_count} unique PRs")
-    return metadata_list
-def fetch_all_reviews_metadata(identifier, agent_name, token=None, start_from_date=None, year=None, exclude_dates=None):
-    """
-    Fetch PR reviews associated with a GitHub user or bot for the past 6 months.
-    Returns lightweight metadata instead of full review objects.
-    This function employs time-based partitioning to navigate GitHub's 1000-result limit per query.
-    It searches using the query pattern:
-    - reviewed-by:{identifier} (PR reviews by the agent)
-    After fetching reviews, it updates PR status to determine if PRs were merged or closed.
-    Args:
-        identifier: GitHub username or bot identifier
-        agent_name: Human-readable name of the agent for metadata purposes
-        token: GitHub API token for authentication
-        start_from_date: Only fetch reviews created after this date (for incremental updates)
-        year: Year parameter (deprecated, retained for compatibility but not utilized)
-        exclude_dates: Set of date objects to exclude from mining (dates that have already been processed)
-    Returns:
-        List of dictionaries containing minimal PR review metadata with PR status
-    """
-    headers = {'Authorization': f'token {token}'} if token else {}
-    # Debug mode: limit review retrieval for testing
-    debug_limit_per_pattern = 10 if DEBUG_MODE else None
-    if DEBUG_MODE:
-        print(f"\n🐛 DEBUG MODE ENABLED: Limiting to {debug_limit_per_pattern} PRs per query pattern")
-    # Define query pattern for PR reviews:
-    query_patterns = []
-    # Add reviewed-by pattern for PR reviews
-    query_patterns.append(f'is:pr reviewed-by:{identifier}')
-    # Use a dict to deduplicate PRs by URL
-    prs_by_url = {}
-    # Define time range: past 6 months only (or from start_from_date if specified)
-    current_time = datetime.now(timezone.utc)
-    six_months_ago = current_time - timedelta(days=180)  # ~6 months
-    if start_from_date:
-        # Use start_from_date but ensure it's not older than 6 months
-        start_date = max(start_from_date, six_months_ago)
-    else:
-        start_date = six_months_ago
-    # End date is current time
-    end_date = current_time
-    for query_pattern in query_patterns:
-        print(f"\n🔍 Searching with query: {query_pattern}")
-        print(f"   Time range: {start_date.strftime('%Y-%m-%d')} to {end_date.strftime('%Y-%m-%d')}")
-        pattern_start_time = time.time()
-        initial_count = len(prs_by_url)
-        # Fetch with time partitioning
-        reviews_found = fetch_reviews_with_time_partition(
-            query_pattern,
-            start_date,
-            end_date,
-            headers,
-            prs_by_url,
-            debug_limit_per_pattern
-        )
-        pattern_duration = time.time() - pattern_start_time
-        new_reviews = len(prs_by_url) - initial_count
-        print(f"   ✓ Pattern complete: {new_reviews} new PRs found ({reviews_found} total fetched, {len(prs_by_url) - initial_count - (reviews_found - new_reviews)} duplicates)")
-        print(f"   ⏱️ Time taken: {pattern_duration:.1f} seconds")
-        # Delay between different query patterns (shorter in debug mode)
-        time.sleep(0.2 if DEBUG_MODE else 1.0)
-    # Convert to lightweight metadata
-    all_prs = list(prs_by_url.values())
-    # Filter out PRs from excluded dates if specified
-    if exclude_dates:
-        filtered_prs = []
-        excluded_count = 0
-        for pr in all_prs:
-            created_at = pr.get('created_at')
-            if created_at:
-                try:
-                    dt = datetime.fromisoformat(created_at.replace('Z', '+00:00'))
-                    pr_date = dt.date()
-                    if pr_date not in exclude_dates:
-                        filtered_prs.append(pr)
-                    else:
-                        excluded_count += 1
-                except Exception:
-                    filtered_prs.append(pr)  # Keep PRs with unparseable dates
-            else:
-                filtered_prs.append(pr)  # Keep PRs without created_at
-        if excluded_count > 0:
-            print(f"   ⏭️ Skipped {excluded_count} PRs from already-mined dates")
-        all_prs = filtered_prs
-    if DEBUG_MODE:
-        print(f"\n✅ COMPLETE (DEBUG MODE): Found {len(all_prs)} unique PRs reviewed by {identifier}")
-        print(f"   Note: In production mode, this would fetch ALL PRs")
-    else:
-        print(f"\n✅ COMPLETE: Found {len(all_prs)} unique PRs reviewed by {identifier}")
-    print(f"📦 Extracting minimal metadata and updating PR status...")
-    # Extract metadata for each PR review
-    metadata_list = [extract_review_metadata(pr) for pr in all_prs]
-    # Update PR status to get current merged/closed state
-    print(f"🔍 Updating PR status for reviewed PRs...")
-    metadata_list = update_pr_status(metadata_list, headers, token)
-    # Calculate memory savings
-    original_size = sys.getsizeof(str(all_prs))
-    metadata_size = sys.getsizeof(str(metadata_list))
-    savings_pct = ((original_size - metadata_size) / original_size * 100) if original_size > 0 else 0
-    print(f"💾 Memory efficiency: {original_size // 1024}KB → {metadata_size // 1024}KB (saved {savings_pct:.1f}%)")
-    return metadata_list
-def group_metadata_by_date(metadata_list):
-    """
-    Group review metadata by exact date (year.month.day) for efficient daily storage.
-    Returns dict: {(year, month, day): [metadata_list]}
-    """
-    grouped = defaultdict(list)
-    for review_meta in metadata_list:
-        reviewed_at = review_meta.get('reviewed_at')
-        if not reviewed_at:
-            continue
-        try:
-            dt = datetime.fromisoformat(reviewed_at.replace('Z', '+00:00'))
-            key = (dt.year, dt.month, dt.day)
-            grouped[key].append(review_meta)
-        except Exception as e:
-            print(f"Warning: Could not parse date '{reviewed_at}': {e}")
-    return dict(grouped)
-def save_review_metadata_to_hf(metadata_list, agent_identifier):
-    """
-    Save review metadata to HuggingFace dataset, organized by [agent_identifier]/YYYY.MM.DD.jsonl.
-    Each file is stored in the agent's folder and named YYYY.MM.DD.jsonl for that day's reviews.
-    In debug mode, saves to in-memory cache only.
-    This function APPENDS new metadata and DEDUPLICATES by sha.
-    Args:
-        metadata_list: List of review metadata dictionaries
-        agent_identifier: GitHub identifier of the agent (used as folder name)
-    """
-    # Skip saving to HF in debug mode - use in-memory cache instead
-    if DEBUG_MODE:
-        global DEBUG_REVIEW_METADATA_CACHE
-        # Merge with existing cache, deduplicating by review_id
-        existing = {review['review_id']: review for review in DEBUG_REVIEW_METADATA_CACHE[agent_identifier] if review.get('review_id')}
-        new = {review['review_id']: review for review in metadata_list if review.get('review_id')}
-        existing.update(new)
-        DEBUG_REVIEW_METADATA_CACHE[agent_identifier] = list(existing.values())
-        print(f"🐛 DEBUG MODE: Saved to in-memory cache only ({len(metadata_list)} reviews) - NOT saved to HuggingFace")
-        return True
-    try:
-        token = get_hf_token()
-        if not token:
-            raise Exception("No HuggingFace token found")
-        api = HfApi()
-        # Group by exact date (year, month, day)
-        grouped = group_metadata_by_date(metadata_list)
-        for (review_year, month, day), day_metadata in grouped.items():
-            # New structure: [agent_identifier]/YYYY.MM.DD.jsonl
-            filename = f"{agent_identifier}/{review_year}.{month:02d}.{day:02d}.jsonl"
-            local_filename = f"{review_year}.{month:02d}.{day:02d}.jsonl"
-            print(f"📤 Uploading {len(day_metadata)} reviews to {filename}...")
-            # Download existing file if it exists
-            existing_metadata = []
-            try:
-                file_path = hf_hub_download(
-                    repo_id=REVIEW_METADATA_REPO,
-                    filename=filename,
-                    repo_type="dataset",
-                    token=token
-                )
-                existing_metadata = load_jsonl(file_path)
-                print(f"   Found {len(existing_metadata)} existing reviews in {filename}")
-            except Exception:
-                print(f"   No existing file found for {filename}, creating new")
-            # Merge and deduplicate by review_id
-            existing_by_id = {meta['review_id']: meta for meta in existing_metadata if meta.get('review_id')}
-            new_by_id = {meta['review_id']: meta for meta in day_metadata if meta.get('review_id')}
-            # Update with new data (new data overwrites old)
-            existing_by_id.update(new_by_id)
-            merged_metadata = list(existing_by_id.values())
-            # Save locally
-            save_jsonl(local_filename, merged_metadata)
-            try:
-                # Upload to HuggingFace with folder path
-                upload_with_retry(
-                    api=api,
-                    path_or_fileobj=local_filename,
-                    path_in_repo=filename,
-                    repo_id=REVIEW_METADATA_REPO,
-                    repo_type="dataset",
-                    token=token
-                )
-                print(f"   ✓ Saved {len(merged_metadata)} total reviews to {filename}")
-            finally:
-                # Always clean up local file, even if upload fails
-                if os.path.exists(local_filename):
-                    os.remove(local_filename)
-        return True
-    except Exception as e:
-        print(f"✗ Error saving review metadata: {str(e)}")
-        return False
-def load_agents_from_hf():
-    try:
-        api = HfApi()
-        agents = []
-        files = api.list_repo_files(repo_id=AGENTS_REPO, repo_type="dataset")
-        json_files = [f for f in files if f.endswith('.json')]
-        print(f"Found {len(json_files)} agent files in {AGENTS_REPO}")
-        for json_file in json_files:
-            try:
-                file_path = hf_hub_download(
-                    repo_id=AGENTS_REPO,
-                    filename=json_file,
-                    repo_type="dataset"
-                )
-                with open(file_path, 'r') as f:
-                    agent_data = json.load(f)
-                    agents.append(agent_data)
-            except Exception as e:
-                print(f"Warning: Could not load {json_file}: {str(e)}")
-                continue
-        print(f"✓ Loaded {len(agents)} agents from HuggingFace")
-        return agents
-    except Exception as e:
-        print(f"Could not load agents from HuggingFace: {str(e)}")
-        return None
-def load_review_metadata_for_year(year):
-    """
-    Load all review metadata for a specific year from HuggingFace.
-    Scans all agent folders and loads daily files matching the year.
-    In debug mode, loads from in-memory cache if available.
-    Structure: [agent_identifier]/YYYY.MM.DD.jsonl
-    Returns:
-        List of dictionaries with 'agent_identifier' added to each review metadata.
-    """
-    # In debug mode, check in-memory cache first
-    if DEBUG_MODE and DEBUG_REVIEW_METADATA_CACHE:
-        all_metadata = []
-        for agent_identifier, metadata_list in DEBUG_REVIEW_METADATA_CACHE.items():
-            for review_meta in metadata_list:
-                review_with_agent = review_meta.copy()
-                review_with_agent['agent_identifier'] = agent_identifier
-                all_metadata.append(review_with_agent)
-        if all_metadata:
-            print(f"🐛 DEBUG MODE: Loading review metadata from in-memory cache ({len(all_metadata)} reviews)")
-            return all_metadata
-    try:
-        api = HfApi()
-        token = get_hf_token()
-        # List all files in the repository
-        files = api.list_repo_files(repo_id=REVIEW_METADATA_REPO, repo_type="dataset")
-        # Filter for files matching the year pattern: [agent_identifier]/YYYY.MM.DD.jsonl
-        # Extract year from filename
-        year_str = str(year)
-        year_files = []
-        for f in files:
-            if f.endswith('.jsonl'):
-                parts = f.split('/')
-                if len(parts) == 2:  # [agent_identifier]/YYYY.MM.DD.jsonl
-                    filename = parts[1]
-                    if filename.startswith(year_str + '.'):
-                        year_files.append(f)
-        print(f"📥 Loading review metadata for {year} ({len(year_files)} daily files across all agents)...")
-        all_metadata = []
-        for filename in year_files:
-            try:
-                # Extract agent_identifier from path (first part)
-                # Format: agent_identifier/YYYY.MM.DD.jsonl
-                parts = filename.split('/')
-                if len(parts) != 2:
-                    print(f"   Warning: Unexpected filename format: {filename}")
-                    continue
-                agent_identifier = parts[0]
-                file_path = hf_hub_download(
-                    repo_id=REVIEW_METADATA_REPO,
-                    filename=filename,
-                    repo_type="dataset",
-                    token=token
-                )
-                day_metadata = load_jsonl(file_path)
-                # Add agent_identifier to each review metadata for processing
-                for review_meta in day_metadata:
-                    review_meta['agent_identifier'] = agent_identifier
-                all_metadata.extend(day_metadata)
-                print(f"   ✓ Loaded {len(day_metadata)} reviews from {filename}")
-            except Exception as e:
-                print(f"   Warning: Could not load {filename}: {str(e)}")
-        print(f"✓ Loaded {len(all_metadata)} total reviews for {year}")
-        return all_metadata
-    except Exception as e:
-        print(f"✗ Error loading review metadata for {year}: {str(e)}")
-        return []
-def get_latest_review_date_for_agent(agent_identifier):
-    """
-    Get the latest review creation date for an agent from stored metadata.
-    Used for incremental updates - only fetch reviews newer than this date.
-    Structure: [agent_identifier]/YYYY.MM.DD.jsonl
-    Args:
-        agent_identifier: GitHub identifier of the agent
-    Returns:
-        datetime or None if no existing reviews found.
-    """
-    try:
-        api = HfApi()
-        token = get_hf_token()
-        # List all files in the repository
-        files = api.list_repo_files(repo_id=REVIEW_METADATA_REPO, repo_type="dataset")
-        # Filter for files in this agent's folder
-        # New structure: [agent_identifier]/YYYY.MM.DD.jsonl
-        agent_pattern = f"{agent_identifier}/"
-        agent_files = [f for f in files if f.startswith(agent_pattern) and f.endswith('.jsonl')]
-        if not agent_files:
-            return None
-        # Find latest review_at across all files
-        latest_date = None
-        for filename in agent_files:
-            try:
-                file_path = hf_hub_download(
-                    repo_id=REVIEW_METADATA_REPO,
-                    filename=filename,
-                    repo_type="dataset",
-                    token=token
-                )
-                metadata = load_jsonl(file_path)
-                for review_meta in metadata:
-                    reviewed_at = review_meta.get("reviewed_at")
-                    if reviewed_at:
-                        try:
-                            dt = datetime.fromisoformat(reviewed_at.replace("Z", "+00:00"))
-                            if latest_date is None or dt > latest_date:
-                                latest_date = dt
-                        except Exception:
-                            continue
-            except Exception:
-                continue
-        return latest_date
-    except Exception:
-        return None
-def get_already_mined_dates(agent_identifier, n_months=6):
-    """
-    Get set of dates that have already been mined for an agent.
-    Args:
-        agent_identifier: GitHub identifier of the agent
-        n_months: Number of months to look back (default: 6)
-    Returns:
-        Set of date objects (datetime.date) that already have data files
-    """
-    try:
-        api = HfApi()
-        # Calculate date range
-        today = datetime.now(timezone.utc)
-        n_months_ago = today - timedelta(days=30 * n_months)
-        # List all files in the repository
-        files = api.list_repo_files(repo_id=REVIEW_METADATA_REPO, repo_type="dataset")
-        # Filter for files in this agent's folder
-        agent_pattern = f"{agent_identifier}/"
-        agent_files = [f for f in files if f.startswith(agent_pattern) and f.endswith('.jsonl')]
-        mined_dates = set()
-        for filename in agent_files:
-            try:
-                # Extract date from filename: [agent_identifier]/YYYY.MM.DD.jsonl
-                parts = filename.split('/')
-                if len(parts) != 2:
-                    continue
-                date_part = parts[1].replace('.jsonl', '')  # Get YYYY.MM.DD
-                date_components = date_part.split('.')
-                if len(date_components) != 3:
-                    continue
-                file_year, file_month, file_day = map(int, date_components)
-                file_date = datetime(file_year, file_month, file_day, tzinfo=timezone.utc).date()
-                # Only include dates within the last n_months
-                if n_months_ago.date() <= file_date <= today.date():
-                    mined_dates.add(file_date)
-            except Exception as e:
-                print(f"   Warning: Could not parse date from filename {filename}: {e}")
-                continue
-        return mined_dates
-    except Exception as e:
-        print(f"   Warning: Could not get already-mined dates for {agent_identifier}: {str(e)}")
-        return set()
-def calculate_review_stats_from_metadata(metadata_list):
-    """
-    Calculate statistics from a list of review metadata (lightweight objects).
-    Works with minimal metadata: html_url, reviewed_at, pr_status, pr_merged, pr_closed_at.
-    Returns a dictionary with comprehensive review metrics.
-    Acceptance Rate is calculated as:
-        merged PRs / (merged PRs + rejected PRs) * 100
-    merged PRs = PRs that were merged (pr_status='merged')
-    Rejected PRs = PRs that were closed without merging (pr_status='closed')
-    Pending PRs = PRs still open (pr_status='open') - excluded from acceptance rate
-    """
-    total_reviews = len(metadata_list)
-    # Count merged PRs (merged)
-    merged_prs = sum(1 for review_meta in metadata_list
-                      if review_meta.get('pr_status') == 'merged')
-    # Count rejected PRs (closed without merging)
-    rejected_prs = sum(1 for review_meta in metadata_list
-                      if review_meta.get('pr_status') == 'closed')
-    # Count pending PRs (still open)
-    pending_prs = sum(1 for review_meta in metadata_list
-                     if review_meta.get('pr_status') == 'open')
-    # Calculate acceptance rate (exclude pending PRs)
-    completed_prs = merged_prs + rejected_prs
-    acceptance_rate = (merged_prs / completed_prs * 100) if completed_prs > 0 else 0
-    return {
-        'total_reviews': total_reviews,
-        'merged_prs': merged_prs,
-        'rejected_prs': rejected_prs,
-        'pending_prs': pending_prs,
-        'acceptance_rate': round(acceptance_rate, 2),
-    }
-def update_all_agents_incremental():
-    """
-    Memory-efficient incremental update of review statistics for all agents.
-    Strategy:
-    1. For each agent, load existing data from SWE-Arena/review_metadata
-    2. Identify already-mined dates (based on filename: YYYY.MM.DD.jsonl)
-    3. Only fetch reviews from dates that haven't been mined yet (within last 6 months)
-    4. If no data exists at all, mine everything from scratch
-    5. Store minimal metadata (not full review objects) to avoid storage limits
-    6. Construct leaderboard from ALL stored metadata (last 6 months)
-    Returns dictionary of all agent data with current stats.
-    """
-    token = get_github_token()
-    current_year = datetime.now().year
-    # Load agent metadata from HuggingFace
-    agents = load_agents_from_hf()
-    if not agents:
-        print("No agents found in HuggingFace dataset")
-        return {}
-    cache_dict = {}
-    # Update each agent
-    for agent in agents:
-        identifier = agent.get('github_identifier')
-        agent_name = agent.get('agent_name', 'Unknown')
-        if not identifier:
-            print(f"Warning: Skipping agent without identifier: {agent}")
-            continue
-        try:
-            print(f"\n{'='*80}")
-            print(f"Processing: {agent_name} ({identifier})")
-            print(f"{'='*80}")
-            # Get already-mined dates for this agent (last 6 months)
-            already_mined_dates = get_already_mined_dates(identifier, n_months=6)
-            if already_mined_dates:
-                print(f"📅 Found {len(already_mined_dates)} already-mined dates")
-                print(f"   Skipping these dates and fetching only new data...")
-                # Fetch only reviews from dates not yet mined
-                new_metadata = fetch_all_reviews_metadata(
-                    identifier,
-                    agent_name,
-                    token,
-                    start_from_date=None,  # Use full 6-month range
-                    exclude_dates=already_mined_dates  # But exclude already-mined dates
-                )
-            else:
-                print(f"📅 No existing data found. Mining everything from scratch...")
-                # Mine everything from scratch (full 6-month range)
-                new_metadata = fetch_all_reviews_metadata(
-                    identifier,
-                    agent_name,
-                    token,
-                    start_from_date=None
-                )
-            if new_metadata:
-                # Save new metadata to HuggingFace (organized by agent_identifier/YYYY.MM.DD.jsonl)
-                print(f"💾 Saving {len(new_metadata)} new review records...")
-                save_review_metadata_to_hf(new_metadata, identifier)
-            else:
-                print(f"   No new reviews to save")
-            # Load ALL metadata for current year to calculate stats (aggregates entire last 6 months)
-            print(f"📊 Calculating statistics from ALL stored metadata (last 6 months)...")
-            all_year_metadata = load_review_metadata_for_year(current_year)
-            # Filter for this specific agent
-            agent_metadata = [review for review in all_year_metadata if review.get("agent_identifier") == identifier]
-            # Calculate stats from metadata
-            stats = calculate_review_stats_from_metadata(agent_metadata)
-            # Merge metadata with stats
-            cache_dict[identifier] = {
-                'agent_name': agent_name,
-                'website': agent.get('website', 'N/A'),
-                'github_identifier': identifier,
-                **stats
-            }
-            print(f"✓ Updated {identifier}: {stats['total_reviews']} reviews, {stats['acceptance_rate']}% acceptance rate")
-        except Exception as e:
-            print(f"✗ Error updating {identifier}: {str(e)}")
-            import traceback
-            traceback.print_exc()
-            continue
-    return cache_dict
-def run_once():
-    print("\n🚀 Immediate mining run started")
-    cache_dict = update_all_agents_incremental()
-    if cache_dict:
-        print(f"✓ Updated {len(cache_dict)} agents")
-    print("✅ Immediate mining run completed\n")
-def main():
-    if DEBUG_MODE:
-        print("\n" + "="*80)
-        print("🐛 DEBUG MODE ENABLED 🐛")
-        print("="*80)
-        print("PR retrieval is limited to 10 PRs per query pattern per agent")
-        print("Data will NOT be saved to HuggingFace in debug mode.")
-        print("="*80 + "\n")
-    else:
-        print("\n🚀 Starting in PRODUCTION MODE - full review retrieval enabled")
-        print()
-    if not args.loop:
-        run_once()
-        return
-    print(f"🔁 Loop mode enabled. Interval: {args.interval_seconds} seconds")
-    try:
-        while True:
-            start = time.time()
-            run_once()
-            elapsed = time.time() - start
-            sleep_for = max(0, args.interval_seconds - int(elapsed))
-            if sleep_for > 0:
-                print(f"😴 Sleeping {sleep_for} seconds before next run...")
-                time.sleep(sleep_for)
-    except KeyboardInterrupt:
-        print("\n👋 Loop interrupted by user. Exiting...")
-if __name__ == "__main__":
-    main()