Update app.py
Browse files
app.py
CHANGED
|
@@ -72,16 +72,17 @@ def transcribe_audio(file_path):
|
|
| 72 |
return "Reference not found.", "", "", "", "", "", ""
|
| 73 |
|
| 74 |
model_ids = [
|
| 75 |
-
"openai/whisper-tiny",
|
| 76 |
-
"openai/whisper-tiny.en",
|
| 77 |
-
"openai/whisper-base",
|
| 78 |
-
"openai/whisper-base.en",
|
| 79 |
-
"openai/whisper-medium",
|
| 80 |
-
"openai/whisper-medium.en",
|
| 81 |
-
"distil-whisper/distil-large-v3.5",
|
| 82 |
-
"facebook/wav2vec2-base-960h",
|
| 83 |
-
"facebook/wav2vec2-large-960h",
|
| 84 |
-
"facebook/hubert-large-ls960-ft",
|
|
|
|
| 85 |
]
|
| 86 |
|
| 87 |
outputs = {}
|
|
@@ -144,6 +145,7 @@ with gr.Blocks() as demo:
|
|
| 144 |
distil_html = gr.HTML(label="Distil-Whisper Large")
|
| 145 |
wav2vec_base_html = gr.HTML(label="Wav2Vec2 Base")
|
| 146 |
wav2vec_large_html = gr.HTML(label="Wav2Vec2 Large")
|
|
|
|
| 147 |
hubert_html = gr.HTML(label="HuBERT Large")
|
| 148 |
|
| 149 |
transcribe_btn.click(
|
|
@@ -160,6 +162,7 @@ with gr.Blocks() as demo:
|
|
| 160 |
distil_html,
|
| 161 |
wav2vec_base_html,
|
| 162 |
wav2vec_large_html,
|
|
|
|
| 163 |
hubert_html,
|
| 164 |
],
|
| 165 |
)
|
|
|
|
| 72 |
return "Reference not found.", "", "", "", "", "", ""
|
| 73 |
|
| 74 |
model_ids = [
|
| 75 |
+
"openai/whisper-tiny", # Smallest, multilingual
|
| 76 |
+
"openai/whisper-tiny.en", # Tiny, English-only
|
| 77 |
+
"openai/whisper-base", # Balanced, multilingual
|
| 78 |
+
"openai/whisper-base.en", # Base, English-only
|
| 79 |
+
"openai/whisper-medium", # Medium, multilingual
|
| 80 |
+
"openai/whisper-medium.en", # Medium, English-only
|
| 81 |
+
"distil-whisper/distil-large-v3.5", # Distilled from Whisper large, Faster & More accurate
|
| 82 |
+
"facebook/wav2vec2-base-960h", # Base model trained on 960h LibriSpeech (monolingual, English)
|
| 83 |
+
"facebook/wav2vec2-large-960h", # Larger model, better performance (monolingual, English)
|
| 84 |
+
"facebook/wav2vec2-large-960h-lv60-self", # Fine-tuned on 60k LibriLight hours
|
| 85 |
+
"facebook/hubert-large-ls960-ft", # Fine-tuned on LibriSpeech
|
| 86 |
]
|
| 87 |
|
| 88 |
outputs = {}
|
|
|
|
| 145 |
distil_html = gr.HTML(label="Distil-Whisper Large")
|
| 146 |
wav2vec_base_html = gr.HTML(label="Wav2Vec2 Base")
|
| 147 |
wav2vec_large_html = gr.HTML(label="Wav2Vec2 Large")
|
| 148 |
+
wav2vec_lv60_html = gr.HTML(label="Wav2Vec2 Large + LibriLight")
|
| 149 |
hubert_html = gr.HTML(label="HuBERT Large")
|
| 150 |
|
| 151 |
transcribe_btn.click(
|
|
|
|
| 162 |
distil_html,
|
| 163 |
wav2vec_base_html,
|
| 164 |
wav2vec_large_html,
|
| 165 |
+
wav2vec_lv60_html,
|
| 166 |
hubert_html,
|
| 167 |
],
|
| 168 |
)
|