Hugging Face Space (status: Running) — commit "Update inference.py"
Files changed: inference.py (+18 −5)
inference.py — CHANGED
|
@@ -10,6 +10,10 @@ from SVCNN import SVCNN
[old-side view — lines before the change]

 10   from utils.tools import extract_voiced_area
 11   from utils.extract_pitch import extract_pitch_ref as extract_pitch, coarse_f0
 12
 13   SPEAKER_INFORMATION_WEIGHTS = [
 14       0, 0, 0, 0, 0, 0, # layer 0-5
 15       1.0, 0, 0, 0,

@@ -51,12 +55,21 @@ def svc(model, src_wav_path, ref_wav_path, synth_set_path=None, f0_factor=0., sp
[old-side view — lines before the change]

 51       if synth_set_path:
 52           synth_set = torch.load(synth_set_path).to(device)
 53       else:
 54 -     (removed line — content not captured in this export)
 55 -     (removed line — content not captured in this export)
 56 -     (removed line — content not captured in this export)
 57 -     (removed line — content not captured in this export)
 58 -     (removed line — content not captured in this export)
 59
 60       query_len = query_seq.shape[0]
 61       if len(query_mask) > query_len:
 62           query_mask = query_mask[:query_len]
|
|
|
[new-side view — lines after the change]

 10       from utils.tools import extract_voiced_area
 11       from utils.extract_pitch import extract_pitch_ref as extract_pitch, coarse_f0
 12
 13 +     from Phoneme_Hallucinator_v2.utils.hparams import HParams
 14 +     from Phoneme_Hallucinator_v2.models import get_model as get_hallucinator
 15 +     from Phoneme_Hallucinator_v2.scripts.speech_expansion_ins import single_expand
 16 +
 17       SPEAKER_INFORMATION_WEIGHTS = [
 18           0, 0, 0, 0, 0, 0, # layer 0-5
 19           1.0, 0, 0, 0,

[new-side view — lines after the change]

 55       if synth_set_path:
 56           synth_set = torch.load(synth_set_path).to(device)
 57       else:
 58 +         synth_set_path = f"matching_set/{ref_name}.pt"
 59 +         synth_set = model.get_matching_set(ref_wav_path, out_path=synth_set_path).to(device)
 60 +
 61 +     if hallucinated_set_path is None:
 62 +         params = HParams('Phoneme_Hallucinator_v2/exp/speech_XXL_cond/params.json')
 63 +         Hallucinator = get_hallucinator(params)
 64 +         Hallucinator.load()
 65 +         hallucinated_set = single_expand(synth_set_path, Hallucinator, 15000)
 66 +     else:
 67 +         hallucinated_set = np.load(hallucinated_set_path)
 68
 69 +     hallucinated_set = torch.from_numpy(hallucinated_set).to(device)
 70 +
 71 +     synth_set = torch.cat([synth_set, hallucinated_set], dim=0)
 72 +
 73       query_len = query_seq.shape[0]
 74       if len(query_mask) > query_len:
 75           query_mask = query_mask[:query_len]

(NOTE: indentation of the reconstructed code lines is inferred from Python context — the export stripped leading whitespace; verify against the repository file.)