Spaces:

Agents-MCP-Hackathon
/

HF_RepoSense

Sleeping

App Files Files Community

naman1102 committed on Jun 8

Commit

ecb092b

1 Parent(s): aa50ddd

j

Browse files

Files changed (2) hide show

app.py +68 -4
repo_explorer.py +50 -52

app.py CHANGED Viewed

@@ -39,10 +39,37 @@ def write_repos_to_csv(repo_ids: List[str]) -> None:
     except Exception as e:
         logger.error(f"Error writing to CSV: {e}")
 def read_csv_to_dataframe() -> pd.DataFrame:
-    """Reads the CSV file into a pandas DataFrame."""
     try:
-        return pd.read_csv(CSV_FILE, dtype=str).fillna('')
     except FileNotFoundError:
         return pd.DataFrame(columns=["repo id", "strength", "weaknesses", "speciality", "relevance rating"])
     except Exception as e:
@@ -225,6 +252,38 @@ def create_ui() -> gr.Blocks:
         background: linear-gradient(45deg, #667eea, #764ba2);
         border-radius: 4px;
     }
     """
     with gr.Blocks(
@@ -324,7 +383,11 @@ def create_ui() -> gr.Blocks:
                 df_output = gr.Dataframe(
                     headers=["Repository", "Strengths", "Weaknesses", "Speciality", "Relevance"],
                     wrap=True,
-                    interactive=False
                 )
             # --- Chatbot Tab ---
@@ -370,7 +433,8 @@ def create_ui() -> gr.Blocks:
                         )
             # --- Repo Explorer Tab ---
-            repo_explorer_tab, repo_components, repo_states = create_repo_explorer_tab()
         # --- Footer ---
         gr.Markdown(

     except Exception as e:
         logger.error(f"Error writing to CSV: {e}")
def format_text_for_dataframe(text: str, max_length: int = 200) -> str:
    """Format text for display in a dataframe cell by cleaning and truncating it.

    Leading/trailing whitespace is removed and every internal run of
    whitespace (including newlines and tabs) is collapsed to a single space.
    If the cleaned text is longer than ``max_length`` it is shortened so the
    result never exceeds ``max_length`` characters, ending in ``"..."``
    whenever there is room for the ellipsis.

    Args:
        text: Value to format. Missing values (``None``, NaN, ``pd.NA``) and
            other falsy values yield an empty string; non-string values are
            converted with ``str()``.
        max_length: Maximum length of the returned string.

    Returns:
        The cleaned, possibly truncated text.
    """
    # Identity checks come first: ``not pd.NA`` raises TypeError, so the
    # truthiness test below must never see it.
    if text is None or text is pd.NA:
        return ""
    if not text or (not isinstance(text, str) and pd.isna(text)):
        return ""

    # split() with no arguments splits on any whitespace run and drops
    # leading/trailing whitespace, so joining with a single space both strips
    # and collapses in one pass.
    cleaned = " ".join(str(text).split())

    if len(cleaned) <= max_length:
        return cleaned

    # With fewer than 3 characters available there is no room for "...", and
    # ``max_length - 3`` would be a negative slice index that keeps almost the
    # whole string. Fall back to a hard cut instead.
    if max_length < 3:
        return cleaned[:max(max_length, 0)]

    return cleaned[:max_length - 3] + "..."
 def read_csv_to_dataframe() -> pd.DataFrame:
+    """Reads the CSV file into a pandas DataFrame with formatted text for display."""
     try:
+        df = pd.read_csv(CSV_FILE, dtype=str).fillna('')
+        # Format text columns for better display
+        if not df.empty:
+            df['strength'] = df['strength'].apply(lambda x: format_text_for_dataframe(x, 180))
+            df['weaknesses'] = df['weaknesses'].apply(lambda x: format_text_for_dataframe(x, 180))
+            df['speciality'] = df['speciality'].apply(lambda x: format_text_for_dataframe(x, 150))
+            df['repo id'] = df['repo id'].apply(lambda x: format_text_for_dataframe(x, 50))
+            # Keep relevance rating as is since it should be short
+        return df
     except FileNotFoundError:
         return pd.DataFrame(columns=["repo id", "strength", "weaknesses", "speciality", "relevance rating"])
     except Exception as e:
         background: linear-gradient(45deg, #667eea, #764ba2);
         border-radius: 4px;
     }
+    /* Improved dataframe styling */
+    .gr-dataframe {
+        max-height: 400px;
+        overflow-y: auto;
+    }
+    .gr-dataframe table {
+        table-layout: fixed;
+        width: 100%;
+    }
+    .gr-dataframe th,
+    .gr-dataframe td {
+        padding: 8px 12px;
+        vertical-align: top;
+        word-wrap: break-word;
+        overflow-wrap: break-word;
+        max-height: 100px;
+        overflow-y: auto;
+    }
+    .gr-dataframe th:nth-child(1),
+    .gr-dataframe td:nth-child(1) { width: 15%; }
+    .gr-dataframe th:nth-child(2),
+    .gr-dataframe td:nth-child(2) { width: 25%; }
+    .gr-dataframe th:nth-child(3),
+    .gr-dataframe td:nth-child(3) { width: 25%; }
+    .gr-dataframe th:nth-child(4),
+    .gr-dataframe td:nth-child(4) { width: 20%; }
+    .gr-dataframe th:nth-child(5),
+    .gr-dataframe td:nth-child(5) { width: 15%; }
     """
     with gr.Blocks(
                 df_output = gr.Dataframe(
                     headers=["Repository", "Strengths", "Weaknesses", "Speciality", "Relevance"],
                     wrap=True,
+                    interactive=False,
+                    max_rows=10,
+                    height=400,
+                    column_widths=["15%", "25%", "25%", "20%", "15%"],
+                    datatype=["str", "str", "str", "str", "str"]
                 )
             # --- Chatbot Tab ---
                         )
             # --- Repo Explorer Tab ---
+            with gr.TabItem("🔍 Repo Explorer", id="repo_explorer_tab"):
+                repo_components, repo_states = create_repo_explorer_tab()
         # --- Footer ---
         gr.Markdown(

repo_explorer.py CHANGED Viewed

@@ -120,10 +120,9 @@ Make this comprehensive but conversational - it will be used by a chatbot to ans
         logger.error(f"Error creating repo context summary: {e}")
         return f"Repository analysis unavailable: {e}"
-def create_repo_explorer_tab() -> Tuple[gr.TabItem, Dict[str, gr.components.Component], Dict[str, gr.State]]:
     """
-    Creates the Repo Explorer tab with all its components and returns the tab,
-    component references, and state variables.
     """
     # State variables for repo explorer
@@ -132,58 +131,57 @@ def create_repo_explorer_tab() -> Tuple[gr.TabItem, Dict[str, gr.components.Comp
         "current_repo_id": gr.State("")
     }
-    with gr.TabItem("🔍 Repo Explorer", id="repo_explorer_tab") as tab:
-        gr.Markdown("### 🗂️ Deep Dive into a Specific Repository")
-        with gr.Row():
-            with gr.Column(scale=2):
-                repo_explorer_input = gr.Textbox(
-                    label="📁 Repository ID",
-                    placeholder="microsoft/DialoGPT-medium",
-                    info="Enter a Hugging Face repository ID to explore"
                 )
-            with gr.Column(scale=1):
-                load_repo_btn = gr.Button("🚀 Load Repository", variant="primary", size="lg")
-        with gr.Row():
-            repo_status_display = gr.Textbox(
-                label="📊 Repository Status",
                 interactive=False,
-                lines=3,
-                info="Current repository loading status and basic info"
             )
-        with gr.Row():
-            with gr.Column(scale=2):
-                repo_chatbot = gr.Chatbot(
-                    label="🤖 Repository Assistant",
-                    height=500,
-                    type="messages",
-                    avatar_images=(
-                        "https://cdn-icons-png.flaticon.com/512/149/149071.png",
-                        "https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.png"
-                    ),
-                    show_copy_button=True
-                )
-                with gr.Row():
-                    repo_msg_input = gr.Textbox(
-                        label="💭 Ask about this repository",
-                        placeholder="What does this repository do? How do I use it?",
-                        lines=1,
-                        scale=4,
-                        info="Ask anything about the loaded repository"
-                    )
-                    repo_send_btn = gr.Button("📤 Send", variant="primary", scale=1)
-            with gr.Column(scale=1):
-                repo_content_display = gr.Textbox(
-                    label="📄 Repository Content Preview",
-                    lines=25,
-                    interactive=False,
-                    show_copy_button=True,
-                    info="Preview of the repository files and content"
-                )
     # Component references
     components = {
@@ -196,7 +194,7 @@ def create_repo_explorer_tab() -> Tuple[gr.TabItem, Dict[str, gr.components.Comp
         "repo_content_display": repo_content_display
     }
-    return tab, components, states
 def handle_load_repository(repo_id: str) -> Tuple[str, str, str]:
     """Load a specific repository and prepare it for exploration with chunk-based analysis."""

         logger.error(f"Error creating repo context summary: {e}")
         return f"Repository analysis unavailable: {e}"
+def create_repo_explorer_tab() -> Tuple[Dict[str, gr.components.Component], Dict[str, gr.State]]:
     """
+    Creates the Repo Explorer tab content and returns the component references and state variables.
     """
     # State variables for repo explorer
         "current_repo_id": gr.State("")
     }
+    gr.Markdown("### 🗂️ Deep Dive into a Specific Repository")
+    with gr.Row():
+        with gr.Column(scale=2):
+            repo_explorer_input = gr.Textbox(
+                label="📁 Repository ID",
+                placeholder="microsoft/DialoGPT-medium",
+                info="Enter a Hugging Face repository ID to explore"
+            )
+        with gr.Column(scale=1):
+            load_repo_btn = gr.Button("🚀 Load Repository", variant="primary", size="lg")
+    with gr.Row():
+        repo_status_display = gr.Textbox(
+            label="📊 Repository Status",
+            interactive=False,
+            lines=3,
+            info="Current repository loading status and basic info"
+        )
+    with gr.Row():
+        with gr.Column(scale=2):
+            repo_chatbot = gr.Chatbot(
+                label="🤖 Repository Assistant",
+                height=500,
+                type="messages",
+                avatar_images=(
+                    "https://cdn-icons-png.flaticon.com/512/149/149071.png",
+                    "https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.png"
+                ),
+                show_copy_button=True
+            )
+            with gr.Row():
+                repo_msg_input = gr.Textbox(
+                    label="💭 Ask about this repository",
+                    placeholder="What does this repository do? How do I use it?",
+                    lines=1,
+                    scale=4,
+                    info="Ask anything about the loaded repository"
                 )
+                repo_send_btn = gr.Button("📤 Send", variant="primary", scale=1)
+        with gr.Column(scale=1):
+            repo_content_display = gr.Textbox(
+                label="📄 Repository Content Preview",
+                lines=25,
                 interactive=False,
+                show_copy_button=True,
+                info="Preview of the repository files and content"
             )
     # Component references
     components = {
         "repo_content_display": repo_content_display
     }
+    return components, states
 def handle_load_repository(repo_id: str) -> Tuple[str, str, str]:
     """Load a specific repository and prepare it for exploration with chunk-based analysis."""