Commit a2e7059
Parent(s): 6231256

Update app.py
app.py CHANGED

@@ -8,7 +8,7 @@ assert (
 ), "LLaMA is now in HuggingFace's main branch.\nPlease reinstall it: pip uninstall transformers && pip install git+https://github.com/huggingface/transformers.git"
 from transformers import LlamaTokenizer, LlamaForCausalLM, GenerationConfig
 
-tokenizer = LlamaTokenizer.from_pretrained("daryl149/llama-2-7b-chat-hf"
+tokenizer = LlamaTokenizer.from_pretrained("daryl149/llama-2-7b-chat-hf")
 
 BASE_MODEL = "daryl149/llama-2-7b-chat-hf"
 LORA_WEIGHTS = "Sparticle/llama-2-7b-japanese-lora"
@@ -30,7 +30,6 @@ if device == "cuda":
         load_in_8bit=False,
         torch_dtype=torch.float16,
         device_map="auto",
-        use_auth_token = True,
     )
     model = PeftModel.from_pretrained(
         model, LORA_WEIGHTS, torch_dtype=torch.float16, force_download=True
@@ -40,7 +39,6 @@ elif device == "mps":
         BASE_MODEL,
         device_map={"": device},
         torch_dtype=torch.float16,
-        use_auth_token = True,
     )
     model = PeftModel.from_pretrained(
         model,