RVC-Project
diff --git a/config.py b/config.py
Lines changed: 41 additions & 32 deletions
diff --git a/export_onnx.py b/export_onnx.py
Lines changed: 29 additions & 26 deletions
diff --git a/extract_f0_print.py b/extract_f0_print.py
Lines changed: 76 additions & 40 deletions
@@ -1,13 +1,13 @@
 ########################硬件参数########################
 
-#填写cuda:x, cpu 或 mps, x指代第几张卡，只支持 N卡 / Apple Silicon 加速
-device  =   "cuda:0"
+# 填写cuda:x, cpu 或 mps, x指代第几张卡，只支持 N卡 / Apple Silicon 加速
+device = "cuda:0"
 
-#9-10-20-30-40系显卡无脑True，不影响质量，>=20显卡开启有加速
-is_half =   True
+# 9-10-20-30-40系显卡无脑True，不影响质量，>=20显卡开启有加速
+is_half = True
 
-#默认0用上所有线程，写数字限制CPU资源使用  
-n_cpu   =   0
+# 默认0用上所有线程，写数字限制CPU资源使用
+n_cpu = 0
 
 ########################硬件参数########################
 
@@ -16,64 +16,73 @@
 
 ########################命令行参数########################
 import argparse
+
 parser = argparse.ArgumentParser()
 parser.add_argument("--port", type=int, default=7865, help="Listen port")
 parser.add_argument("--pycmd", type=str, default="python", help="Python command")
-parser.add_argument("--colab", action='store_true', help="Launch in colab")
-parser.add_argument("--noparallel", action='store_true', help="Disable parallel processing")
-parser.add_argument("--noautoopen", action='store_true', help="Do not open in browser automatically")
+parser.add_argument("--colab", action="store_true", help="Launch in colab")
+parser.add_argument(
+    "--noparallel", action="store_true", help="Disable parallel processing"
+)
+parser.add_argument(
+    "--noautoopen", action="store_true", help="Do not open in browser automatically"
+)
 cmd_opts = parser.parse_args()
 
-python_cmd=cmd_opts.pycmd
-listen_port=cmd_opts.port
-iscolab=cmd_opts.colab
-noparallel=cmd_opts.noparallel
-noautoopen=cmd_opts.noautoopen
+python_cmd = cmd_opts.pycmd
+listen_port = cmd_opts.port
+iscolab = cmd_opts.colab
+noparallel = cmd_opts.noparallel
+noautoopen = cmd_opts.noautoopen
 ########################命令行参数########################
 
 import sys
 import torch
 
+
 # has_mps is only available in nightly pytorch (for now) and macOS 12.3+.
 # check `getattr` and try it for compatibility
 def has_mps() -> bool:
     if sys.platform != "darwin":
         return False
     else:
-        if not getattr(torch, 'has_mps', False): return False
+        if not getattr(torch, "has_mps", False):
+            return False
         try:
             torch.zeros(1).to(torch.device("mps"))
             return True
         except Exception:
             return False
 
 
-if(not torch.cuda.is_available()):
+if not torch.cuda.is_available():
     if has_mps():
         print("没有发现支持的N卡, 使用MPS进行推理")
-        device  = "mps"
+        device = "mps"
     else:
         print("没有发现支持的N卡, 使用CPU进行推理")
-        device  = "cpu"
+        device = "cpu"
         is_half = False
 
-if(device not in ["cpu", "mps"]):
+if device not in ["cpu", "mps"]:
     gpu_name = torch.cuda.get_device_name(int(device.split(":")[-1]))
-    if("16" in gpu_name or "MX" in gpu_name):
+    if "16" in gpu_name or "MX" in gpu_name:
         print("16系显卡/MX系显卡强制单精度")
         is_half = False
 
 from multiprocessing import cpu_count
-if(n_cpu==0): n_cpu=cpu_count()
-if(is_half):
-    #6G显存配置
-    x_pad       =   3
-    x_query     =   10
-    x_center    =   60
-    x_max       =   65
+
+if n_cpu == 0:
+    n_cpu = cpu_count()
+if is_half:
+    # 6G显存配置
+    x_pad = 3
+    x_query = 10
+    x_center = 60
+    x_max = 65
 else:
-    #5G显存配置
-    x_pad       =   1
-    x_query     =   6
-    x_center    =   38
-    x_max       =   41
+    # 5G显存配置
+    x_pad = 1
+    x_query = 6
+    x_center = 38
+    x_max = 41
@@ -5,40 +5,43 @@
 exported_path = "model.onnx"
 
 
-
 cpt = torch.load(person, map_location="cpu")
-cpt["config"][-3]=cpt["weight"]["emb_g.weight"].shape[0]#n_spk
+cpt["config"][-3] = cpt["weight"]["emb_g.weight"].shape[0]  # n_spk
 print(*cpt["config"])
 net_g = SynthesizerTrnMs256NSFsid(*cpt["config"], is_half=False)
 net_g.load_state_dict(cpt["weight"], strict=False)
 
 test_phone = torch.rand(1, 200, 256)
 test_phone_lengths = torch.tensor([200]).long()
-test_pitch = torch.randint(size=(1 ,200),low=5,high=255)
+test_pitch = torch.randint(size=(1, 200), low=5, high=255)
 test_pitchf = torch.rand(1, 200)
 test_ds = torch.LongTensor([0])
 test_rnd = torch.rand(1, 192, 200)
 input_names = ["phone", "phone_lengths", "pitch", "pitchf", "ds", "rnd"]
-output_names = ["audio", ]
-device="cpu"
-torch.onnx.export(net_g,
-            (
-                test_phone.to(device),
-                test_phone_lengths.to(device),
-                test_pitch.to(device),
-                test_pitchf.to(device),
-                test_ds.to(device),
-                test_rnd.to(device)
-            ),
-            exported_path,
-            dynamic_axes={
-                "phone": [1],
-                "pitch": [1],
-                "pitchf": [1],
-                "rnd": [2],
-            },
-            do_constant_folding=False,
-            opset_version=16,
-            verbose=False,
-            input_names=input_names,
-            output_names=output_names)
+output_names = [
+    "audio",
+]
+device = "cpu"
+torch.onnx.export(
+    net_g,
+    (
+        test_phone.to(device),
+        test_phone_lengths.to(device),
+        test_pitch.to(device),
+        test_pitchf.to(device),
+        test_ds.to(device),
+        test_rnd.to(device),
+    ),
+    exported_path,
+    dynamic_axes={
+        "phone": [1],
+        "pitch": [1],
+        "pitchf": [1],
+        "rnd": [2],
+    },
+    do_constant_folding=False,
+    opset_version=16,
+    verbose=False,
+    input_names=input_names,
+    output_names=output_names,
+)
@@ -1,21 +1,26 @@
-import os,traceback,sys,parselmouth
+import os, traceback, sys, parselmouth
 import librosa
 import pyworld
 from scipy.io import wavfile
-import numpy as np,logging
-logging.getLogger('numba').setLevel(logging.WARNING)
+import numpy as np, logging
+
+logging.getLogger("numba").setLevel(logging.WARNING)
 from multiprocessing import Process
 
 exp_dir = sys.argv[1]
-f = open("%s/extract_f0_feature.log"%exp_dir, "a+")
+f = open("%s/extract_f0_feature.log" % exp_dir, "a+")
+
+
 def printt(strr):
     print(strr)
     f.write("%s\n" % strr)
     f.flush()
 
+
 n_p = int(sys.argv[2])
 f0method = sys.argv[3]
 
+
 class FeatureInput(object):
     def __init__(self, samplerate=16000, hop_size=160):
         self.fs = samplerate
@@ -27,21 +32,30 @@ def __init__(self, samplerate=16000, hop_size=160):
         self.f0_mel_min = 1127 * np.log(1 + self.f0_min / 700)
         self.f0_mel_max = 1127 * np.log(1 + self.f0_max / 700)
 
-    def compute_f0(self, path,f0_method):
+    def compute_f0(self, path, f0_method):
         x, sr = librosa.load(path, self.fs)
-        p_len=x.shape[0]//self.hop
+        p_len = x.shape[0] // self.hop
         assert sr == self.fs
-        if(f0_method=="pm"):
+        if f0_method == "pm":
             time_step = 160 / 16000 * 1000
             f0_min = 50
             f0_max = 1100
-            f0 = parselmouth.Sound(x, sr).to_pitch_ac(
-                time_step=time_step / 1000, voicing_threshold=0.6,
-                pitch_floor=f0_min, pitch_ceiling=f0_max).selected_array['frequency']
-            pad_size=(p_len - len(f0) + 1) // 2
-            if(pad_size>0 or p_len - len(f0) - pad_size>0):
-                f0 = np.pad(f0,[[pad_size,p_len - len(f0) - pad_size]], mode='constant')
-        elif(f0_method=="harvest"):
+            f0 = (
+                parselmouth.Sound(x, sr)
+                .to_pitch_ac(
+                    time_step=time_step / 1000,
+                    voicing_threshold=0.6,
+                    pitch_floor=f0_min,
+                    pitch_ceiling=f0_max,
+                )
+                .selected_array["frequency"]
+            )
+            pad_size = (p_len - len(f0) + 1) // 2
+            if pad_size > 0 or p_len - len(f0) - pad_size > 0:
+                f0 = np.pad(
+                    f0, [[pad_size, p_len - len(f0) - pad_size]], mode="constant"
+                )
+        elif f0_method == "harvest":
             f0, t = pyworld.harvest(
                 x.astype(np.double),
                 fs=sr,
@@ -50,7 +64,7 @@ def compute_f0(self, path,f0_method):
                 frame_period=1000 * self.hop / sr,
             )
             f0 = pyworld.stonemask(x.astype(np.double), f0, t, self.fs)
-        elif(f0_method=="dio"):
+        elif f0_method == "dio":
             f0, t = pyworld.dio(
                 x.astype(np.double),
                 fs=sr,
@@ -77,45 +91,67 @@ def coarse_f0(self, f0):
         )
         return f0_coarse
 
-    def go(self,paths,f0_method):
-        if (len(paths) == 0): printt("no-f0-todo")
+    def go(self, paths, f0_method):
+        if len(paths) == 0:
+            printt("no-f0-todo")
         else:
-            printt("todo-f0-%s"%len(paths))
-            n=max(len(paths)//5,1)#每个进程最多打印5条
-            for idx,(inp_path,opt_path1,opt_path2) in enumerate(paths):
+            printt("todo-f0-%s" % len(paths))
+            n = max(len(paths) // 5, 1)  # 每个进程最多打印5条
+            for idx, (inp_path, opt_path1, opt_path2) in enumerate(paths):
                 try:
-                    if(idx%n==0):printt("f0ing,now-%s,all-%s,-%s"%(idx,len(paths),inp_path))
-                    if(os.path.exists(opt_path1+".npy")==True and os.path.exists(opt_path2+".npy")==True):continue
-                    featur_pit = self.compute_f0(inp_path,f0_method)
-                    np.save(opt_path2,featur_pit,allow_pickle=False,)#nsf
+                    if idx % n == 0:
+                        printt("f0ing,now-%s,all-%s,-%s" % (idx, len(paths), inp_path))
+                    if (
+                        os.path.exists(opt_path1 + ".npy") == True
+                        and os.path.exists(opt_path2 + ".npy") == True
+                    ):
+                        continue
+                    featur_pit = self.compute_f0(inp_path, f0_method)
+                    np.save(
+                        opt_path2,
+                        featur_pit,
+                        allow_pickle=False,
+                    )  # nsf
                     coarse_pit = self.coarse_f0(featur_pit)
-                    np.save(opt_path1,coarse_pit,allow_pickle=False,)#ori
+                    np.save(
+                        opt_path1,
+                        coarse_pit,
+                        allow_pickle=False,
+                    )  # ori
                 except:
-                    printt("f0fail-%s-%s-%s" % (idx, inp_path,traceback.format_exc()))
+                    printt("f0fail-%s-%s-%s" % (idx, inp_path, traceback.format_exc()))
 
-if __name__=='__main__':
+
+if __name__ == "__main__":
     # exp_dir=r"E:\codes\py39\dataset\mi-test"
     # n_p=16
     # f = open("%s/log_extract_f0.log"%exp_dir, "w")
     printt(sys.argv)
     featureInput = FeatureInput()
-    paths=[]
-    inp_root= "%s/1_16k_wavs"%(exp_dir)
-    opt_root1="%s/2a_f0"%(exp_dir)
-    opt_root2="%s/2b-f0nsf"%(exp_dir)
+    paths = []
+    inp_root = "%s/1_16k_wavs" % (exp_dir)
+    opt_root1 = "%s/2a_f0" % (exp_dir)
+    opt_root2 = "%s/2b-f0nsf" % (exp_dir)
 
-    os.makedirs(opt_root1,exist_ok=True)
-    os.makedirs(opt_root2,exist_ok=True)
+    os.makedirs(opt_root1, exist_ok=True)
+    os.makedirs(opt_root2, exist_ok=True)
     for name in sorted(list(os.listdir(inp_root))):
-        inp_path="%s/%s"%(inp_root,name)
-        if ("spec" in inp_path): continue
-        opt_path1="%s/%s"%(opt_root1,name)
-        opt_path2="%s/%s"%(opt_root2,name)
-        paths.append([inp_path,opt_path1,opt_path2])
+        inp_path = "%s/%s" % (inp_root, name)
+        if "spec" in inp_path:
+            continue
+        opt_path1 = "%s/%s" % (opt_root1, name)
+        opt_path2 = "%s/%s" % (opt_root2, name)
+        paths.append([inp_path, opt_path1, opt_path2])
 
-    ps=[]
+    ps = []
     for i in range(n_p):
-        p=Process(target=featureInput.go,args=(paths[i::n_p],f0method,))
+        p = Process(
+            target=featureInput.go,
+            args=(
+                paths[i::n_p],
+                f0method,
+            ),
+        )
         p.start()
         ps.append(p)
     for p in ps: