Spaces:
Build error
Build error
Commit
·
bb788ed
1
Parent(s):
aecf994
Update app.py
Browse files
app.py
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
-
from faiss import IndexFlatIP
|
| 3 |
import pandas as pd
|
| 4 |
import numpy as np
|
| 5 |
from transformers import AutoTokenizer
|
|
@@ -7,7 +7,7 @@ from transformers import AutoTokenizer
|
|
| 7 |
|
| 8 |
tokenizer = AutoTokenizer.from_pretrained("bert-large-uncased")
|
| 9 |
input_embeddings = np.load("bert_input_embeddings.npy")
|
| 10 |
-
index =
|
| 11 |
index.add(input_embeddings)
|
| 12 |
vocab = {v:k for k,v in tokenizer.vocab.items()}
|
| 13 |
lookup_table = pd.Series(vocab).sort_index()
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
+
from faiss import IndexFlatIP, IndexFlatL2
|
| 3 |
import pandas as pd
|
| 4 |
import numpy as np
|
| 5 |
from transformers import AutoTokenizer
|
|
|
|
| 7 |
|
| 8 |
tokenizer = AutoTokenizer.from_pretrained("bert-large-uncased")
|
| 9 |
input_embeddings = np.load("bert_input_embeddings.npy")
|
| 10 |
+
index = IndexFlatL2(input_embeddings.shape[-1])
|
| 11 |
index.add(input_embeddings)
|
| 12 |
vocab = {v:k for k,v in tokenizer.vocab.items()}
|
| 13 |
lookup_table = pd.Series(vocab).sort_index()
|