static-embeddings / potion.py
gregtatum's picture
Add the initial models
f7fef32
raw
history blame contribute delete
403 Bytes
from model2vec import StaticModel
from tokenizers import Tokenizer
import torch
model = StaticModel.from_pretrained("minishlab/potion-multilingual-128M")
embeddings = torch.from_numpy(model.embedding)
print("Embedding shape:", embeddings.shape)
bytes = embeddings.shape[0] * embeddings.shape[1] * 4
print("MiB:", bytes / 1024 / 1024)
tokenizer: Tokenizer = model.tokenizer
print(tokenizer.to_str())