Spaces:
Runtime error
Runtime error
gamingflexer
committed on
Commit
·
80ed9e0
1
Parent(s):
dc3eeb1
dummy file updated & .gitignore
Browse files
- .gitignore +3 -1
- src/app.py +1 -3
- src/db/vector_fucntions.py +0 -0
- src/scrapper/articles.py +8 -0
.gitignore
CHANGED
|
@@ -162,4 +162,6 @@ src/flagged/log.csv
|
|
| 162 |
.vscode/PythonImportHelper-v2-Completion.json
|
| 163 |
notebooks/*.pdf
|
| 164 |
notebooks/notebooks/papers/*.jsonl
|
| 165 |
-
src/data/papers/*.jsonl
|
|
|
|
|
|
|
|
|
| 162 |
.vscode/PythonImportHelper-v2-Completion.json
|
| 163 |
notebooks/*.pdf
|
| 164 |
notebooks/notebooks/papers/*.jsonl
|
| 165 |
+
src/data/papers/*.jsonl
|
| 166 |
+
src/data/papers/*
|
| 167 |
+
src/notebooks/papers/*.jsonl
|
src/app.py
CHANGED
|
@@ -6,8 +6,6 @@ from config import *
|
|
| 6 |
from db.db_functions import get_correct_author_name, insert_papers_data, fetch_papers_data, get_unquine_authors
|
| 7 |
from utils import compare_paper_ids
|
| 8 |
|
| 9 |
-
unique_authors_df = get_unquine_authors()
|
| 10 |
-
|
| 11 |
def plagiarism_checker(authors_name_fetch,number_of_results_fetch, progress=gr.Progress()):
|
| 12 |
number_of_results_fetch = int(number_of_results_fetch)
|
| 13 |
print(authors_name_fetch,number_of_results_fetch,type(number_of_results_fetch))
|
|
@@ -69,7 +67,7 @@ with gr.Blocks() as demo:
|
|
| 69 |
'references', 'categories', 'comment', 'journal_ref', 'source',
|
| 70 |
'summary', 'published'])
|
| 71 |
with gr.Row():
|
| 72 |
-
unquine_authors_output = gr.Dataframe(headers=["author_name"],value=
|
| 73 |
|
| 74 |
|
| 75 |
with gr.Tab("Arxiv Plagiarism Fetcher & Save to DB"):
|
|
|
|
| 6 |
from db.db_functions import get_correct_author_name, insert_papers_data, fetch_papers_data, get_unquine_authors
|
| 7 |
from utils import compare_paper_ids
|
| 8 |
|
|
|
|
|
|
|
| 9 |
def plagiarism_checker(authors_name_fetch,number_of_results_fetch, progress=gr.Progress()):
|
| 10 |
number_of_results_fetch = int(number_of_results_fetch)
|
| 11 |
print(authors_name_fetch,number_of_results_fetch,type(number_of_results_fetch))
|
|
|
|
| 67 |
'references', 'categories', 'comment', 'journal_ref', 'source',
|
| 68 |
'summary', 'published'])
|
| 69 |
with gr.Row():
|
| 70 |
+
unquine_authors_output = gr.Dataframe(headers=["author_name"],value=get_unquine_authors(), label=" Authors Currently in our DB")
|
| 71 |
|
| 72 |
|
| 73 |
with gr.Tab("Arxiv Plagiarism Fetcher & Save to DB"):
|
src/db/vector_fucntions.py
ADDED
|
File without changes
|
src/scrapper/articles.py
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
from langchain_community.document_loaders import AsyncChromiumLoader
|
| 2 |
+
from langchain_community.document_transformers import BeautifulSoupTransformer
|
| 3 |
+
|
| 4 |
+
class GetSimilarArticles:
|
| 5 |
+
|
| 6 |
+
def __init__(self, paper_title_name: str):
|
| 7 |
+
self.paper_title_name = paper_title_name
|
| 8 |
+
|