Spaces:

mayankpuvvala
/

Spoken_English_Scoring

Sleeping

App Files Files Community

mayankpuvvala committed on May 5

Commit

5d66bfc

verified ·

1 Parent(s): c64a43c

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -17

app.py CHANGED Viewed

@@ -1,8 +1,6 @@
 import gradio as gr
 import torch
 from transformers import pipeline, AutoTokenizer, AutoModelForSequenceClassification
-import tempfile
-import torchaudio
 # Load Whisper for transcription
 asr_pipeline = pipeline("automatic-speech-recognition", model="openai/whisper-large-v3")
@@ -15,21 +13,16 @@ grammar_pipeline = pipeline("text-classification", model=cola_model, tokenizer=c
 # Load grammar correction model
 correction_pipeline = pipeline("text2text-generation", model="vennify/t5-base-grammar-correction")
-def process_audio(audio_file):
-    # Save uploaded file to temporary path
-    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp:
-        tmp.write(audio_file.read())
-        tmp_path = tmp.name
-    # Transcription
-    transcription = asr_pipeline(tmp_path)["text"]
-    # Grammar Scoring
     grammar_result = grammar_pipeline(transcription)[0]
     score_label = grammar_result["label"]
     score_confidence = grammar_result["score"]
-    # Correction
     corrected_text = correction_pipeline(transcription, max_length=128)[0]["generated_text"]
     return transcription, f"{score_label} ({score_confidence:.2f})", corrected_text
@@ -37,14 +30,18 @@ def process_audio(audio_file):
 # Gradio Interface
 interface = gr.Interface(
     fn=process_audio,
-    inputs=gr.Audio(type="file", label="Upload your .wav file"),
     outputs=[
-        gr.Textbox(label="Transcription"),
-        gr.Textbox(label="Grammar Score"),
-        gr.Textbox(label="Grammar Correction")
     ],
     title="🎙️ Voice Grammar Scorer",
-    description="Upload your voice (WAV file). This app transcribes it, scores grammar, and suggests corrections."
 )
 if __name__ == "__main__":

 import gradio as gr
 import torch
 from transformers import pipeline, AutoTokenizer, AutoModelForSequenceClassification
 # Load Whisper for transcription
 asr_pipeline = pipeline("automatic-speech-recognition", model="openai/whisper-large-v3")
 # Load grammar correction model
 correction_pipeline = pipeline("text2text-generation", model="vennify/t5-base-grammar-correction")
+def process_audio(audio_path):
+    # Transcribe: run the Whisper ASR pipeline on audio_path and keep its "text" field
+    transcription = asr_pipeline(audio_path)["text"]
+    # Score grammar: use the first classifier result's label and confidence score
     grammar_result = grammar_pipeline(transcription)[0]
     score_label = grammar_result["label"]
     score_confidence = grammar_result["score"]
+    # Suggest correction: first generated candidate, generation capped at max_length=128
     corrected_text = correction_pipeline(transcription, max_length=128)[0]["generated_text"]
     return transcription, f"{score_label} ({score_confidence:.2f})", corrected_text
 # Gradio Interface
 interface = gr.Interface(
     fn=process_audio,
+    inputs=gr.Audio(
+        source="microphone",  # NOTE(review): a single source value selects one input mode (microphone here); confirm file upload is still offered as the label claims
+        type="filepath",
+        label="🎤 Record or Upload Audio (.wav)"
+    ),
     outputs=[
+        gr.Textbox(label="📝 Transcription"),
+        gr.Textbox(label="✅ Grammar Score"),
+        gr.Textbox(label="✍️ Suggested Correction")
     ],
     title="🎙️ Voice Grammar Scorer",
+    description="Record or upload your voice (.wav). This app transcribes it, scores grammar, and suggests corrections."
 )
 if __name__ == "__main__":