Spaces:

ignitariumcloud
/

NvidiaCanary-2.5

Sleeping

manueljohnson063 committed on Aug 22

Commit

c9d0e01

verified ·

1 Parent(s): 621e9b8

Upload 2 files

Files changed (2) hide show

app.py CHANGED Viewed

@@ -13,6 +13,9 @@ model_id = "nvidia/canary-qwen-2.5b"
 print("Loading NVIDIA Canary-Qwen-2.5B model using NeMo...")
 model = SALM.from_pretrained(model_id)
 def generate_text(prompt, max_tokens=200, temperature=0.7, top_p=0.9):
     """Generate text using the NVIDIA NeMo model (LLM mode)"""
@@ -28,7 +31,8 @@ def generate_text(prompt, max_tokens=200, temperature=0.7, top_p=0.9):
             )
         # Convert IDs to text using model's tokenizer
-        response = model.tokenizer.ids_to_text(answer_ids[0].cpu())
         return response
     except Exception as e:
@@ -50,7 +54,8 @@ def transcribe_audio(audio_file, user_prompt="Transcribe the following:"):
         )
         # Convert IDs to text
-        transcript = model.tokenizer.ids_to_text(answer_ids[0].cpu())
         return transcript
     except Exception as e:

 print("Loading NVIDIA Canary-Qwen-2.5B model using NeMo...")
 model = SALM.from_pretrained(model_id)
+device = "cuda" if torch.cuda.is_available() else "cpu"
+model = model.to(device)
 def generate_text(prompt, max_tokens=200, temperature=0.7, top_p=0.9):
     """Generate text using the NVIDIA NeMo model (LLM mode)"""
             )
         # Convert IDs to text using model's tokenizer
+        # response = model.tokenizer.ids_to_text(answer_ids[0].cpu())
+        response = model.tokenizer.ids_to_text(answer_ids[0].to(device))
         return response
     except Exception as e:
         )
         # Convert IDs to text
+        # transcript = model.tokenizer.ids_to_text(answer_ids[0].cpu())
+        transcript = model.tokenizer.ids_to_text(answer_ids[0].to(device))
         return transcript
     except Exception as e:

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
-torch>=2.6.0
 gradio>=4.0.0
 nemo_toolkit[asr,tts] @ git+https://github.com/NVIDIA/NeMo.git
 accelerate>=0.20.0

+torch==2.6.0+cu118 --extra-index-url https://download.pytorch.org/whl/cu118
 gradio>=4.0.0
 nemo_toolkit[asr,tts] @ git+https://github.com/NVIDIA/NeMo.git
 accelerate>=0.20.0