Spaces:

Pgohari
/

Orbii-KM

Sleeping

Pgohari committed on Aug 26, 2024

Commit

a66e61b

verified ·

1 Parent(s): d354ed6

update the model to mt5-small

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,20 +1,26 @@
 import gradio as gr
-from transformers import AutoModelForCausalLM, AutoTokenizer
-# Load the Mistral AI model and tokenizer from Hugging Face
-model_name = "mistralai/Mistral-7B"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(model_name)
-# Define the chatbot function
 def chatbot(user_input):
-    inputs = tokenizer(user_input, return_tensors="pt")
-    outputs = model.generate(inputs['input_ids'], max_length=50)
     response = tokenizer.decode(outputs[0], skip_special_tokens=True)
     return response
 # Set up the Gradio interface
-demo = gr.Interface(fn=chatbot, inputs="text", outputs="text", title="Mistral AI Chatbot")
 # Launch the app
 demo.launch()

 import gradio as gr
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
+# Load the mT5-small model and tokenizer
+model_name = "google/mt5-small"
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
+# Define the chatbot function for summarization and answering questions
 def chatbot(user_input):
+    # Tokenize the user input
+    inputs = tokenizer(user_input, return_tensors="pt", max_length=512, truncation=True)
+    # Generate a response (you can customize max_length and num_beams for different outputs)
+    outputs = model.generate(inputs["input_ids"], max_length=150, num_beams=2, early_stopping=True)
+    # Decode and return the generated text
     response = tokenizer.decode(outputs[0], skip_special_tokens=True)
     return response
 # Set up the Gradio interface
+demo = gr.Interface(fn=chatbot, inputs="text", outputs="text", title="mT5-Small Chatbot")
 # Launch the app
 demo.launch()