Spaces:

awacke1
/

AIKnowledgeTreeBuilder

Sleeping

App Files Files Community

awacke1 committed on Nov 2, 2024

Commit

5edd789

verified ·

1 Parent(s): 138b961

Update app.py

Browse files

Files changed (1) hide show

app.py +91 -54

app.py CHANGED Viewed

@@ -2,8 +2,10 @@ import streamlit as st
 import os
 import glob
 import re
-import datetime
 from urllib.parse import quote
 # Define the markdown variables
 Boxing_and_MMA_Commentary_and_Knowledge = """
@@ -38,7 +40,6 @@ Boxing_and_MMA_Commentary_and_Knowledge = """
 """
 Multiplayer_Custom_Hosting_Game_Servers_For_Simulated_Worlds = """
 # Multiplayer Simulated Worlds
 1. 7 Days To Die PC
@@ -70,43 +71,89 @@ Multiplayer_Custom_Hosting_Game_Servers_For_Simulated_Worlds = """
 27. The Forest PC
 28. Crossplay
 29. Valheim
 """
-# Function to parse markdown text and create external links for terms
def display_external_links(term):
    """Render one markdown bullet for *term* with external search links.

    The bullet shows the term in bold followed by links to ArXiv,
    Wikipedia, Google and YouTube, separated by " | ". The term is
    percent-encoded with ``quote`` before being placed in each URL.

    Args:
        term: Text to display and to search for.
    """
    # Link label -> callable building the target URL for a keyword.
    search_urls = {
        "ArXiv": lambda k: f"https://arxiv.org/search/?query={quote(k)}",
        "Wikipedia": lambda k: f"https://en.wikipedia.org/wiki/{quote(k)}",
        "Google": lambda k: f"https://www.google.com/search?q={quote(k)}",
        "YouTube": lambda k: f"https://www.youtube.com/results?search_query={quote(k)}",
    }
    link_parts = []
    for name, url in search_urls.items():
        link_parts.append(f"[{name}]({url(term)})")
    links_md = ' | '.join(link_parts)
    st.markdown(f"- **{term}** - {links_md}")
 # Function to parse markdown text and extract terms
 def extract_terms(markdown_text):
     """Return the non-empty lines of *markdown_text* without markdown prefixes.

     Leading heading (``#``), bullet (``*``, ``-``), block-quote (``>``)
     markers, whitespace and ordered-list numbering (``1.``, ``27.``) are
     removed from every line. Lines that are empty afterwards are dropped.

     Only a number that is immediately followed by a dot and then
     whitespace (or the end of the line) counts as list numbering, so a
     term that itself starts with a number keeps it:
     ``"1. 7 Days To Die PC"`` yields ``"7 Days To Die PC"``.

     Args:
         markdown_text: Markdown source, one candidate term per line.

     Returns:
         List of cleaned terms in their original order.
     """
     # The previous character class also contained digits and dots, which
     # swallowed numbers that are part of the term itself.
     prefix_pattern = r'^(?:[#*\->\s]|\d+\.(?=\s|$))+'
     terms = []
     for line in markdown_text.strip().split('\n'):
         term = re.sub(prefix_pattern, '', line).strip()
         if term:
             terms.append(term)
     return terms
-# Function to create internal links with query parameters
def display_internal_links(term):
    """Render a markdown bullet linking *term* back to this app.

    The link carries the percent-encoded term in the ``q`` query
    parameter.

    Args:
        term: Text to display and to pass as the ``q`` parameter.
    """
    # Streamlit exposes no ``st.request`` object, so the host URL cannot
    # be read that way; a root-relative link avoids needing it.
    link = f"/?q={quote(term)}"
    st.markdown(f"- [{term}]({link})")
-# Function to automatically generate filenames based on date and content
 def generate_filename(prefix, content):
     """Build a ``.md`` filename from a prefix, a timestamp and a content slug.

     Args:
         prefix: Leading part of the filename.
         content: Text whose first 50 characters become the slug.

     Returns:
         ``"<prefix>_<YYYYmmdd_HHMMSS>_<slug>.md"``, where the timestamp is
         taken from ``datetime.datetime.now()``.
     """
     # Each run of non-word characters in the slug becomes one underscore.
     safe_content = re.sub(r'\W+', '_', content[:50])
     timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
     return f"{prefix}_{timestamp}_{safe_content}.md"
@@ -160,7 +207,7 @@ def file_management_sidebar():
     # Option to create a new markdown file
     if st.sidebar.button("Create New Markdown File"):
         # Generate automatic filename
-        timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
         new_filename = f"note_{timestamp}.md"
         with open(new_filename, 'w', encoding='utf-8') as f:
             f.write("# New Markdown File\n")
@@ -170,46 +217,36 @@ def file_management_sidebar():
 # Main application logic
 def main():
     """Render the page: source markdown, generated links, query handling, sidebar.

     When the URL carries a ``q`` query parameter, its first value is
     echoed and a markdown file describing the query is written to the
     current working directory.
     """
     st.title("Markdown Content with Links and File Management")

     documents = (
         Boxing_and_MMA_Commentary_and_Knowledge,
         Multiplayer_Custom_Hosting_Game_Servers_For_Simulated_Worlds,
     )

     # Show the markdown sources unchanged.
     st.markdown("## Original Markdown Content")
     for document in documents:
         st.markdown(document)

     # One bullet of external search links per extracted term.
     st.markdown("## External Links Generated from Markdown Content")
     for document in documents:
         for term in extract_terms(document):
             display_external_links(term)

     # One bullet linking back into this app per extracted term.
     st.markdown("## Internal Links Generated from Markdown Content")
     for document in documents:
         for term in extract_terms(document):
             display_internal_links(term)

     # Handle the 'q' query parameter from the URL.
     query_params = st.experimental_get_query_params()
     if 'q' in query_params:
         search_query = query_params['q'][0]
         st.write(f"### Search query received: {search_query}")
         # No real search is performed; a placeholder result file is written.
         filename = generate_filename("search", search_query)
         content = (
             f"# Search Results for '{search_query}'\n\n"
             f"Here are the results for your search query: '{search_query}'.\n"
         )
         with open(filename, 'w', encoding='utf-8') as f:
             f.write(content)
         st.write(f"Generated file **{filename}** with search results.")

     # File management sidebar
     file_management_sidebar()

 import os
 import glob
 import re
 from urllib.parse import quote
+from gradio_client import Client
+import json
+from datetime import datetime
 # Define the markdown variables
 Boxing_and_MMA_Commentary_and_Knowledge = """
 """
 Multiplayer_Custom_Hosting_Game_Servers_For_Simulated_Worlds = """
 # Multiplayer Simulated Worlds
 1. 7 Days To Die PC
 27. The Forest PC
 28. Crossplay
 29. Valheim
 """
 # Function to parse markdown text and extract terms
 def extract_terms(markdown_text):
     """Return the non-empty lines of *markdown_text* without markdown prefixes.

     Leading heading (``#``), bullet (``*``, ``-``), block-quote (``>``)
     markers, whitespace and ordered-list numbering (``1.``, ``27.``) are
     removed from every line. Lines that are empty afterwards are dropped.

     Only a number that is immediately followed by a dot and then
     whitespace (or the end of the line) counts as list numbering, so a
     term that itself starts with a number keeps it:
     ``"1. 7 Days To Die PC"`` yields ``"7 Days To Die PC"``.

     Args:
         markdown_text: Markdown source, one candidate term per line.

     Returns:
         List of cleaned terms in their original order.
     """
     # The previous character class also contained digits and dots, which
     # swallowed numbers that are part of the term itself.
     prefix_pattern = r'^(?:[#*\->\s]|\d+\.(?=\s|$))+'
     terms = []
     for line in markdown_text.strip().split('\n'):
         term = re.sub(prefix_pattern, '', line).strip()
         if term:
             terms.append(term)
     return terms
+# Function to display terms with links
def display_terms_with_links(terms):
    """Render each term in bold followed by a row of emoji search links.

    The first link points back into this app (``/?q=<term>``); the others
    go to Wikipedia, Google, YouTube, Bing and Twitter. The term is
    percent-encoded with ``quote`` before being placed in each URL.

    Args:
        terms: Iterable of term strings, rendered one markdown line each.
    """
    # Link label -> callable building the target URL for a keyword.
    search_urls = {
        "🚀🌌ArXiv": lambda k: f"/?q={quote(k)}",
        "📖": lambda k: f"https://en.wikipedia.org/wiki/{quote(k)}",
        "🔍": lambda k: f"https://www.google.com/search?q={quote(k)}",
        "▶️": lambda k: f"https://www.youtube.com/results?search_query={quote(k)}",
        "🔎": lambda k: f"https://www.bing.com/search?q={quote(k)}",
        "🐦": lambda k: f"https://twitter.com/search?q={quote(k)}",
    }
    for term in terms:
        link_parts = []
        for emoji, url in search_urls.items():
            link_parts.append(f"[{emoji}]({url(term)})")
        links_md = ' '.join(link_parts)
        st.markdown(f"**{term}** {links_md}", unsafe_allow_html=True)
+# Function to perform AI lookup using Gradio client
def perform_ai_lookup(query):
    """Ask two hosted LLMs about *query* and render both answers.

    A Gradio client for ``awacke1/Arxiv-Paper-Search-And-QA-RAG-Pattern``
    is created and its ``/ask_llm`` endpoint is called once per model,
    Mixtral first and Mistral second. Each answer is rendered under its
    own heading as soon as it is available.

    Args:
        query: Prompt sent unchanged to both models.

    Returns:
        Both answers formatted into one string, separated by a blank line.
    """
    st.write("Performing AI Lookup...")
    client = Client("awacke1/Arxiv-Paper-Search-And-QA-RAG-Pattern")

    # (model identifier, heading shown above that model's answer)
    model_runs = (
        ("mistralai/Mixtral-8x7B-Instruct-v0.1", "### Mixtral-8x7B-Instruct-v0.1 Result"),
        ("mistralai/Mistral-7B-Instruct-v0.2", "### Mistral-7B-Instruct-v0.2 Result"),
    )
    answers = []
    for model_id, heading in model_runs:
        answer = client.predict(
            prompt=query,
            llm_model_picked=model_id,
            stream_outputs=True,
            api_name="/ask_llm"
        )
        st.markdown(heading)
        st.markdown(answer)
        answers.append(answer)

    result1, result2 = answers
    return f"{result1}\n\n{result2}"
+# Function to extract URLs from AI result
def extract_urls(text):
    """Summarise arXiv entries found in *text* as a markdown listing.

    Four kinds of fragments are collected independently: ``### DD Mon YYYY``
    dates, the bracketed title following such a date, markdown links to
    ``https://arxiv.org/abs/...`` and ``[⬇️]`` links to
    ``https://arxiv.org/pdf/...``. The n-th match of each kind is combined
    into the n-th entry.

    Pairing is purely positional. When the four kinds do not occur equally
    often, only as many entries as the rarest kind are produced, instead of
    failing on the first missing item and discarding everything.

    Args:
        text: AI answer text to scan.

    Returns:
        Markdown with Date, Title, Abstract Link and PDF Link for every
        entry, each followed by a ``---`` rule; ``''`` when nothing is
        found or *text* cannot be searched.
    """
    date_pattern = re.compile(r'### (\d{2} \w{3} \d{4})')
    abs_link_pattern = re.compile(r'\[(.*?)\]\((https://arxiv\.org/abs/\d+\.\d+)\)')
    pdf_link_pattern = re.compile(r'\[⬇️\]\((https://arxiv\.org/pdf/\d+\.\d+)\)')
    title_pattern = re.compile(r'### \d{2} \w{3} \d{4} \| \[(.*?)\]')

    try:
        date_matches = date_pattern.findall(text)
        abs_link_matches = abs_link_pattern.findall(text)
        pdf_link_matches = pdf_link_pattern.findall(text)
        title_matches = title_pattern.findall(text)
    except TypeError as e:
        # findall raises TypeError when text is not a str.
        st.write(f"An error occurred in extract_urls: {e}")
        return ''

    entries = []
    # abs_link_pattern has two groups (link text, URL); only the URL is used.
    for date, title, (_, abs_link), pdf_link in zip(
        date_matches, title_matches, abs_link_matches, pdf_link_matches
    ):
        entries.append(
            f"**Date:** {date}\n\n"
            f"**Title:** {title}\n\n"
            f"**Abstract Link:** [{abs_link}]({abs_link})\n\n"
            f"**PDF Link:** [{pdf_link}]({pdf_link})\n\n"
            "---\n\n"
        )
    return ''.join(entries)
+# Function to generate filename based on date and content
 def generate_filename(prefix, content):
     """Build a ``.md`` filename from a prefix, a timestamp and a content slug.

     Args:
         prefix: Leading part of the filename.
         content: Text whose first 50 characters become the slug.

     Returns:
         ``"<prefix>_<YYYYmmdd_HHMMSS>_<slug>.md"``, where the timestamp is
         taken from ``datetime.now()``.
     """
     # Each run of non-word characters in the slug becomes one underscore.
     safe_content = re.sub(r'\W+', '_', content[:50])
     timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
     return f"{prefix}_{timestamp}_{safe_content}.md"
     # Option to create a new markdown file
     if st.sidebar.button("Create New Markdown File"):
         # Generate automatic filename
+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         new_filename = f"note_{timestamp}.md"
         with open(new_filename, 'w', encoding='utf-8') as f:
             f.write("# New Markdown File\n")
 # Main application logic
 def main():
     """Render the page: source markdown, term links, AI lookup, sidebar.

     When the URL carries a ``q`` query parameter, its first value is sent
     to ``perform_ai_lookup``, the arXiv entries extracted from the answer
     are shown, and the same listing is written to a markdown file in the
     current working directory.
     """
     st.title("Markdown Content with AI Lookup and File Management")

     # Show the markdown sources unchanged.
     st.markdown("## Original Markdown Content")
     for document in (
         Boxing_and_MMA_Commentary_and_Knowledge,
         Multiplayer_Custom_Hosting_Game_Servers_For_Simulated_Worlds,
     ):
         st.markdown(document)

     # Terms of both documents are listed together, boxing terms first.
     st.markdown("## Terms with Links")
     terms1 = extract_terms(Boxing_and_MMA_Commentary_and_Knowledge)
     terms2 = extract_terms(Multiplayer_Custom_Hosting_Game_Servers_For_Simulated_Worlds)
     display_terms_with_links(terms1 + terms2)

     # Handle the 'q' query parameter from the URL.
     query_params = st.experimental_get_query_params()
     if 'q' in query_params:
         search_query = query_params['q'][0]
         st.write(f"### Search query received: {search_query}")

         # Query both models, then reduce the answers to the arXiv listing.
         ai_result = perform_ai_lookup(search_query)
         markdown_text = extract_urls(ai_result)
         st.markdown("## Extracted URLs")
         st.markdown(markdown_text)

         # Persist the listing; the file is written even when it is empty.
         filename = generate_filename("AI_Result", search_query)
         with open(filename, 'w', encoding='utf-8') as f:
             f.write(markdown_text)
         st.write(f"Generated file **{filename}** with AI lookup results.")

     # File management sidebar
     file_management_sidebar()