Spaces:
Runtime error
Runtime error
app.py and requirements.txt init
Browse files- app.py +68 -0
- requirements.txt +19 -0
app.py
ADDED
|
@@ -0,0 +1,68 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import os
|
| 2 |
+
import torch
|
| 3 |
+
import gradio as gr
|
| 4 |
+
from huggingface_hub import hf_hub_download
|
| 5 |
+
from train import init, inference_file
|
| 6 |
+
import tempfile
|
| 7 |
+
|
| 8 |
+
# ===== Basic config =====
# Run on GPU whenever torch can see one; otherwise fall back to CPU.
USE_CUDA = torch.cuda.is_available()
# Inference batch size, overridable through the BATCH_SIZE env var.
BATCH_SIZE = int(os.environ.get("BATCH_SIZE", "12"))

# Checkpoint location on the Hugging Face Hub, overridable via env vars.
REPO_ID = os.environ.get("MODEL_REPO_ID", "chenxie95/Language-Audio-Banquet-ckpt")
FILENAME = os.environ.get("MODEL_FILENAME", "ev-pre-aug.ckpt")

# ===== Download & load weights =====
# Fetch (and locally cache) the checkpoint, then build the inference
# system once at process startup so every request reuses it.
ckpt_path = hf_hub_download(repo_id=REPO_ID, filename=FILENAME)
system = init(ckpt_path, batch_size=BATCH_SIZE, use_cuda=USE_CUDA)
|
| 19 |
+
|
| 20 |
+
# ===== Inference =====
def inference(audio_path: str) -> str:
    """Enhance one noisy audio file and return the path of the result.

    Parameters
    ----------
    audio_path : str
        Filesystem path of the noisy input clip, as handed over by the
        Gradio ``Audio(type="filepath")`` component. May have any audio
        extension, not only ``.wav``.

    Returns
    -------
    str
        Path of the enhanced file, written to the system temp directory.
    """
    temp_dir = tempfile.gettempdir()
    # Use splitext instead of `name.replace('.wav', '_enhanced.wav')`:
    # the old form produced NO distinct name for non-.wav inputs
    # (microphone/webm, mp3, flac uploads) and matched '.wav' anywhere
    # in the filename. This keeps the original extension and always
    # appends '_enhanced'; extensionless inputs default to '.wav'.
    stem, ext = os.path.splitext(os.path.basename(audio_path))
    output_path = os.path.join(temp_dir, f"{stem}_enhanced{ext or '.wav'}")
    # NOTE(review): audio_path is passed twice — presumably
    # (system, input, output, text/reference source); confirm against
    # train.inference_file's signature.
    inference_file(system, audio_path, output_path, audio_path)
    return output_path
|
| 27 |
+
|
| 28 |
+
# ===== Gradio UI =====
with gr.Blocks() as demo:
    # Page header with usage instructions.
    gr.Markdown(
        """
# 🎧 DCCRN Speech Enhancement (Demo)
**How to use:** drag & drop a noisy audio clip (or upload / record) → click **Enhance** → listen & download the result.
**Sample audio:** click a sample below to auto-fill the input, then click **Enhance**.
"""
    )

    with gr.Row():
        noisy_input = gr.Audio(
            # The "upload" source accepts drag & drop out of the box.
            sources=["upload", "microphone"],
            type="filepath",
            label="Input: noisy speech (drag & drop or upload / record)",
        )
        enhanced_output = gr.Audio(
            label="Output: enhanced speech (downloadable)",
            show_download_button=True,
        )

    run_button = gr.Button("Enhance")

    # On-page sample clips (these files must exist in the repo).
    gr.Examples(
        examples=[
            ["examples/noisy_1.wav"],
            ["examples/noisy_2.wav"],
            ["examples/noisy_3.wav"],
        ],
        inputs=noisy_input,
        label="Sample audio",
        examples_per_page=3,
    )

    # Gradio >= 4.44 configures concurrency on the event listener itself;
    # a single worker keeps GPU memory use predictable.
    run_button.click(
        inference,
        inputs=noisy_input,
        outputs=enhanced_output,
        concurrency_limit=1,
    )

# Keep the request queue small to avoid OOM under load.
demo.queue(max_size=16)
demo.launch()
|
requirements.txt
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
einops==0.8.1
fire==0.7.0
# gradio and huggingface_hub are imported by app.py but were missing here,
# which makes the Space fail at import time.
gradio>=4.44.0
hear21passt==0.0.26
huggingface_hub
hyper_connections==0.2.1
laion_clap==1.1.7
librosa==0.9.2
museval==0.4.1
numpy==2.3.3
omegaconf==2.3.0
packaging==25.0
pandas==2.3.2
pytorch_lightning==2.1.0
rotary_embedding_torch==0.3.5
scikit_learn==1.7.2
# NOTE: '+cu126' local-version wheels are not on PyPI; pip needs
# --extra-index-url https://download.pytorch.org/whl/cu126 to resolve these.
torch==2.7.0+cu126
torch_audiomentations==0.12.0
torchaudio==2.7.0+cu126
torchmetrics==0.11.4
tqdm==4.66.4
|