sovits4dzl

Sleeping

App Files Community

Vegecken committed on Mar 5, 2023

Commit

03b417a

1 Parent(s): b01ceec

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -5

app.py CHANGED Viewed

@@ -14,7 +14,7 @@ logging.getLogger('markdown_it').setLevel(logging.WARNING)
 logging.getLogger('urllib3').setLevel(logging.WARNING)
 logging.getLogger('matplotlib').setLevel(logging.WARNING)
-model = Svc("logs/44k/G_27200.pth", "configs/config.json", cluster_model_path="logs/44k/kmeans_10000.pt")
@@ -24,8 +24,8 @@ def vc_fn(sid, input_audio, vc_transform, auto_f0,cluster_ratio, noise_scale):
     sampling_rate, audio = input_audio
     # print(audio.shape,sampling_rate)
     duration = audio.shape[0] / sampling_rate
-    if duration > 45:
-        return "请上传小于45s的音频，需要转换长音频请本地进行转换", None
     audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
     if len(audio.shape) > 1:
         audio = librosa.to_mono(audio.transpose(1, 0))
@@ -48,13 +48,13 @@ with app:
     with gr.Tabs():
         with gr.TabItem("Basic"):
             gr.Markdown(value="""
-                sovits4.0 nemo在线demo
                 """)
             spks = list(model.spk2id.keys())
             sid = gr.Dropdown(label="音色", choices=["nemo", "1"], value="yunhao")
-            vc_input3 = gr.Audio(label="上传音频（长度小于45秒）")
             vc_transform = gr.Number(label="变调（整数，可以正负，半音数量，升高八度就是12）", value=0)
             cluster_ratio = gr.Number(label="聚类模型混合比例，0-1之间，默认为0不启用聚类，能提升音色相似度，但会导致咬字下降（如果使用建议0.5左右）", value=0)
             auto_f0 = gr.Checkbox(label="自动f0预测，配合聚类模型f0预测效果更好,会导致变调功能失效（仅限转换语音，歌声不要勾选此项会究极跑调）", value=False)

 logging.getLogger('urllib3').setLevel(logging.WARNING)
 logging.getLogger('matplotlib').setLevel(logging.WARNING)
+model = Svc("logs/44k/model.pth", "configs/config.json", cluster_model_path="logs/44k/kmeans_10000.pt")
     sampling_rate, audio = input_audio
     # print(audio.shape,sampling_rate)
     duration = audio.shape[0] / sampling_rate
+    if duration > 30:
+        return "这只是个DEMO只能有30s的长度", None
     audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
     if len(audio.shape) > 1:
         audio = librosa.to_mono(audio.transpose(1, 0))
     with gr.Tabs():
         with gr.TabItem("Basic"):
             gr.Markdown(value="""
+                sovits4.0 东知了在线demo
                 """)
             spks = list(model.spk2id.keys())
             sid = gr.Dropdown(label="音色", choices=["nemo", "1"], value="yunhao")
+            vc_input3 = gr.Audio(label="上传音频（长度小于30秒）")
             vc_transform = gr.Number(label="变调（整数，可以正负，半音数量，升高八度就是12）", value=0)
             cluster_ratio = gr.Number(label="聚类模型混合比例，0-1之间，默认为0不启用聚类，能提升音色相似度，但会导致咬字下降（如果使用建议0.5左右）", value=0)
             auto_f0 = gr.Checkbox(label="自动f0预测，配合聚类模型f0预测效果更好,会导致变调功能失效（仅限转换语音，歌声不要勾选此项会究极跑调）", value=False)