rvc-genshin-impact

Paused

App Files Files Community

ozipoetra committed on Jul 3, 2024

Commit

62d077f

1 Parent(s): e48fdae

yest

Browse files

Files changed (2) hide show

app.py +4 -4
lib/vc/vc_infer_pipeline.py +2 -2

app.py CHANGED Viewed

@@ -58,8 +58,8 @@ else:
     f0method_mode = ["pm", "harvest", "crepe"]
     f0method_info = "PM is fast, Harvest is good but extremely slow, Rvmpe is alternative to harvest (might be better), and Crepe effect is good but requires GPU (Default: PM)"
-if os.path.isfile("assets/rmvpe/rmvpe.pt"):
-    f0method_mode.insert(2, "rmvpe")
 def create_vc_fn(model_name, tgt_sr, net_g, vc, if_f0, version, file_index):
     def vc_fn(
@@ -408,7 +408,7 @@ if __name__ == '__main__':
                                         tts_text = gr.Textbox(label="TTS text", info="Text to speech input", visible=False)
                                         tts_voice = gr.Dropdown(label="Edge-tts speaker", choices=voices, visible=False, allow_custom_value=False, value="en-US-AnaNeural-Female")
                                     with gr.Column():
-                                        vc_transform0 = gr.Number(label="Transpose", value=0, info='Type "12" to change from male to female voice. Type "-12" to change female to male voice')
                                         f0method0 = gr.Radio(
                                             label="Pitch extraction algorithm",
                                             info=f0method_info,
@@ -447,7 +447,7 @@ if __name__ == '__main__':
                                             maximum=1,
                                             label="Volume Envelope",
                                             info="Use the volume envelope of the input to replace or mix with the volume envelope of the output. The closer the ratio is to 1, the more the output envelope is used",
-                                            value=1,
                                             interactive=True,
                                         )
                                         protect0 = gr.Slider(

     f0method_mode = ["pm", "harvest", "crepe"]
     f0method_info = "PM is fast, Harvest is good but extremely slow, Rvmpe is alternative to harvest (might be better), and Crepe effect is good but requires GPU (Default: PM)"
+if os.path.isfile("assets/rvmpe/rvmpe.pt"):
+    f0method_mode.insert(2, "rvmpe")
 def create_vc_fn(model_name, tgt_sr, net_g, vc, if_f0, version, file_index):
     def vc_fn(
                                         tts_text = gr.Textbox(label="TTS text", info="Text to speech input", visible=False)
                                         tts_voice = gr.Dropdown(label="Edge-tts speaker", choices=voices, visible=False, allow_custom_value=False, value="en-US-AnaNeural-Female")
                                     with gr.Column():
+                                        vc_transform0 = gr.Number(label="Transpose", value=12, info='Type "12" to change from male to female voice. Type "-12" to change female to male voice')
                                         f0method0 = gr.Radio(
                                             label="Pitch extraction algorithm",
                                             info=f0method_info,
                                             maximum=1,
                                             label="Volume Envelope",
                                             info="Use the volume envelope of the input to replace or mix with the volume envelope of the output. The closer the ratio is to 1, the more the output envelope is used",
+                                            value=0.1,
                                             interactive=True,
                                         )
                                         protect0 = gr.Slider(

lib/vc/vc_infer_pipeline.py CHANGED Viewed

@@ -129,11 +129,11 @@ class VC(object):
             f0 = f0[0].cpu().numpy()
         elif f0_method == "rmvpe":
             if hasattr(self, "model_rmvpe") == False:
-                from lib.vc.rmvpe import RMVPE
                 print("loading rmvpe model")
                 self.model_rmvpe = RMVPE(
-                    os.path.join("assets", "rvmpe", "rmvpe.pt"), is_half=self.is_half, device=self.device
                 )
             f0 = self.model_rmvpe.infer_from_audio(x, thred=0.03)
         f0 *= pow(2, f0_up_key / 12)

             f0 = f0[0].cpu().numpy()
         elif f0_method == "rmvpe":
             if hasattr(self, "model_rmvpe") == False:
+                from rmvpe import RMVPE
                 print("loading rmvpe model")
                 self.model_rmvpe = RMVPE(
+                    os.path.join("assets", "rvmpe", "rvmpe.pt"), is_half=self.is_half, device=self.device
                 )
             f0 = self.model_rmvpe.infer_from_audio(x, thred=0.03)
         f0 *= pow(2, f0_up_key / 12)