vtube_rvc

Running

App Files Files Community

Kit-Lemonfoot committed on Nov 11, 2023

Commit

daaa3ac

•

1 Parent(s): b1eebc3

Added Vshojo and Phaseconnect models. Updated Vedal and Anny images. Added credits

Browse files

Files changed (1) hide show

app.py +14 -6

app.py CHANGED Viewed

@@ -31,7 +31,7 @@ limitation = os.getenv("SYSTEM") == "spaces"
 audio_mode = []
 f0method_mode = ["pm", "crepe", "harvest"]
-f0method_info = "PM is fast, rmvpe is middle. Crepe or harvest is good but it was extremely slow (Default: PM))"
 if limitation is True:
     audio_mode = ["TTS Audio", "Upload audio"]
 else:
@@ -47,11 +47,11 @@ def infer(name, path, index, vc_audio_mode, vc_input, vc_upload, tts_text, tts_v
             audio, sr = librosa.load(vc_input, sr=16000, mono=True)
         elif vc_audio_mode == "Upload audio":
             if vc_upload is None:
-                return "You need to upload an audio.", None
             sampling_rate, audio = vc_upload
             duration = audio.shape[0] / sampling_rate
             if duration > 360 and limitation:
-                return "Please upload an audio file that is less than 1 minute.", None
             audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
             if len(audio.shape) > 1:
                 audio = librosa.to_mono(audio.transpose(1, 0))
@@ -342,7 +342,8 @@ if __name__ == '__main__':
             "# <center> VTuber RVC Models\n"
             "### <center> Space by Kit Lemonfoot / Noel Shirogane's High Flying Birds"
             "<center> Original space by megaaziib & zomehwh\n"
-            "### <center> Please credit the original model authors if you use this Space.\n"
             "<center> (I will be adding more tabs later. Don't ask.)\n"
         )
         for (folder_title, folder, models) in categories:
@@ -393,7 +394,7 @@ if __name__ == '__main__':
                                         minimum=0,
                                         maximum=1,
                                         label="Retrieval feature ratio",
-                                        info="Accents controling. Too high prob gonna sounds too robotic (Default: 0.4)",
                                         value=0.4,
                                         interactive=True,
                                     )
@@ -410,7 +411,7 @@ if __name__ == '__main__':
                                         minimum=0,
                                         maximum=48000,
                                         label="Resample the output audio",
-                                        info="Resample the output audio in post-processing to the final sample rate. Set to 0 for no resampling",
                                         value=0,
                                         step=1,
                                         interactive=True,
@@ -504,6 +505,13 @@ if __name__ == '__main__':
                                 tts_voice
                             ]
                         )
 if limitation is True:
     app.queue(concurrency_count=1, max_size=20, api_open=config.api).launch(share=config.colab)
 else:

 audio_mode = []
 f0method_mode = ["pm", "crepe", "harvest"]
+f0method_info = "PM is fast but low quality, crepe and harvest are slow but good quality, RMVPE is the best of both worlds. (Default: RMVPE))"
 if limitation is True:
     audio_mode = ["TTS Audio", "Upload audio"]
 else:
             audio, sr = librosa.load(vc_input, sr=16000, mono=True)
         elif vc_audio_mode == "Upload audio":
             if vc_upload is None:
+                return "Please upload an audio file.", None
             sampling_rate, audio = vc_upload
             duration = audio.shape[0] / sampling_rate
             if duration > 360 and limitation:
+                return "Too long! Please upload an audio file that is less than 1 minute.", None
             audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
             if len(audio.shape) > 1:
                 audio = librosa.to_mono(audio.transpose(1, 0))
             "# <center> VTuber RVC Models\n"
             "### <center> Space by Kit Lemonfoot / Noel Shirogane's High Flying Birds"
             "<center> Original space by megaaziib & zomehwh\n"
+            "### <center> Please credit the original model authors if you use this Space."
+            "<center>Do no evil.\n"
             "<center> (I will be adding more tabs later. Don't ask.)\n"
         )
         for (folder_title, folder, models) in categories:
                                         minimum=0,
                                         maximum=1,
                                         label="Retrieval feature ratio",
+                                        info="Accent control. Too high will usually sound too robotic. (Default: 0.4)",
                                         value=0.4,
                                         interactive=True,
                                     )
                                         minimum=0,
                                         maximum=48000,
                                         label="Resample the output audio",
+                                        info="Resample the output audio in post-processing to the final sample rate. Set to 0 for no resampling.",
                                         value=0,
                                         step=1,
                                         interactive=True,
                                 tts_voice
                             ]
                         )
+        gr.Markdown(
+            "## <center>Credit to:\n"
+            "#### <center>Original devs:\n"
+            "<center>the RVC Project, lj1995, zomehwh \n\n"
+            "#### <center>Model creators:\n"
+            "<center>dacoolkid44, Hijack, Maki Ligon, megaaziib, KitLemonfoot, yeey5, Sui, Itaxhix, Acato, Kyuubical, MartinFLL, Listra92, IshimaIshimsky, ZomballTH, Jotape91, RigidSpinner, RandomAssBettel, Oida, Nhat Minh, Ardha27, Legitdark, TempoHawk, 0x3e9, Kaiaya, Skeetawn, Sonphantrung, Pianissimo\n"
+        )
 if limitation is True:
     app.queue(concurrency_count=1, max_size=20, api_open=config.api).launch(share=config.colab)
 else: