Update app.py
Browse files
app.py
CHANGED
|
@@ -5,14 +5,10 @@ from llama_cpp import Llama
|
|
| 5 |
# Load GGUF model
|
| 6 |
# ----------------------------------------------------
|
| 7 |
|
| 8 |
-
MODEL_PATH = "astegaras/merged_kaggle" # HF repo containing your .gguf
|
| 9 |
-
|
| 10 |
# llama_cpp automatically downloads from HF Hub if you provide the repo
|
| 11 |
llm = Llama.from_pretrained(
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
n_ctx=4096,
|
| 15 |
-
verbose=False,
|
| 16 |
)
|
| 17 |
|
| 18 |
# ----------------------------------------------------
|
|
|
|
| 5 |
# Load GGUF model
|
| 6 |
# ----------------------------------------------------
|
| 7 |
|
|
|
|
|
|
|
| 8 |
# llama_cpp automatically downloads the GGUF file named by `filename` from the HF Hub repo given by `repo_id`
|
| 9 |
llm = Llama.from_pretrained(
|
| 10 |
+
repo_id="astegaras/merged_kaggle",
|
| 11 |
+
filename="llama-3.2-3b-instruct.Q4_K_M.gguf",
|
|
|
|
|
|
|
| 12 |
)
|
| 13 |
|
| 14 |
# ----------------------------------------------------
|