from enum import Enum import os import sys import tempfile from typing import Literal, TypeAlias VoiceChangerType: TypeAlias = Literal[ "MMVCv13", "MMVCv15", "so-vits-svc-40", "DDSP-SVC", "RVC", "Diffusion-SVC" ] STORED_SETTING_FILE = "stored_setting.json" SERVER_DEVICE_SAMPLE_RATES = [16000, 32000, 44100, 48000, 96000, 192000] tmpdir = tempfile.TemporaryDirectory() SSL_KEY_DIR = os.path.join(tmpdir.name, "keys") if hasattr(sys, "_MEIPASS") else "keys" MODEL_DIR = os.path.join(tmpdir.name, "logs") if hasattr(sys, "_MEIPASS") else "logs" UPLOAD_DIR = os.path.join(tmpdir.name, "upload_dir") if hasattr(sys, "_MEIPASS") else "upload_dir" NATIVE_CLIENT_FILE_WIN = os.path.join(sys._MEIPASS, "voice-changer-native-client.exe") if hasattr(sys, "_MEIPASS") else "voice-changer-native-client" # type: ignore NATIVE_CLIENT_FILE_MAC = ( os.path.join( sys._MEIPASS, # type: ignore "voice-changer-native-client.app", "Contents", "MacOS", "voice-changer-native-client", ) if hasattr(sys, "_MEIPASS") else "voice-changer-native-client" ) HUBERT_ONNX_MODEL_PATH = os.path.join(sys._MEIPASS, "model_hubert/hubert_simple.onnx") if hasattr(sys, "_MEIPASS") else "model_hubert/hubert_simple.onnx" # type: ignore TMP_DIR = os.path.join(tmpdir.name, "tmp_dir") if hasattr(sys, "_MEIPASS") else "tmp_dir" os.makedirs(TMP_DIR, exist_ok=True) def getFrontendPath(): frontend_path = os.path.join(sys._MEIPASS, "dist") if hasattr(sys, "_MEIPASS") else "../client/demo/dist" return frontend_path EmbedderType: TypeAlias = Literal[ "hubert_base", "contentvec", "hubert-base-japanese" ] class EnumInferenceTypes(Enum): pyTorchRVC = "pyTorchRVC" pyTorchRVCNono = "pyTorchRVCNono" pyTorchRVCv2 = "pyTorchRVCv2" pyTorchRVCv2Nono = "pyTorchRVCv2Nono" pyTorchWebUI = "pyTorchWebUI" pyTorchWebUINono = "pyTorchWebUINono" pyTorchVoRASbeta = "pyTorchVoRASbeta" onnxRVC = "onnxRVC" onnxRVCNono = "onnxRVCNono" DiffusionSVCInferenceType: TypeAlias = Literal[ "combo", ] PitchExtractorType: TypeAlias = Literal[ "harvest", "dio", "crepe", "crepe_full", "crepe_tiny", "rmvpe", ] ServerAudioDeviceType: TypeAlias = Literal[ "audioinput", "audiooutput" ] RVCSampleMode: TypeAlias = Literal[ "production", "testOfficial", "testDDPNTorch", "testDDPNONNX", "testONNXFull", ] def getSampleJsonAndModelIds(mode: RVCSampleMode): if mode == "production": return [ # "https://huggingface.co/wok000/vcclient_model/raw/main/samples_0001.json", # "https://huggingface.co/wok000/vcclient_model/raw/main/samples_0002.json", "https://huggingface.co/wok000/vcclient_model/raw/main/samples_0003_t2.json", "https://huggingface.co/wok000/vcclient_model/raw/main/samples_0003_o2.json", "https://huggingface.co/wok000/vcclient_model/raw/main/samples_0003_d2.json", ], [ ("Tsukuyomi-chan_o", {"useIndex": False}), ("Amitaro_o", {"useIndex": False}), ("KikotoMahiro_o", {"useIndex": False}), ("TokinaShigure_o", {"useIndex": True}), ("diffusion_combo_spk5_nl3_dl20_k50_500ep", {}), ("diffusion_combo_spk5_nl3_dl1_k50_500ep", {}), ] elif mode == "testOfficial": return [ "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_official_v1_v2.json", "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_ddpn_v1_v2.json", ], [ ("test-official-v1-f0-48k-l9-hubert_t", {"useIndex": True}), ("test-official-v1-nof0-48k-l9-hubert_t", {"useIndex": False}), ("test-official-v2-f0-40k-l12-hubert_t", {"useIndex": False}), ("test-official-v2-nof0-40k-l12-hubert_t", {"useIndex": False}), ("test-official-v1-f0-48k-l9-hubert_o", {"useIndex": True}), ("test-official-v1-nof0-48k-l9-hubert_o", {"useIndex": False}), ("test-official-v2-f0-40k-l12-hubert_o", {"useIndex": False}), ("test-official-v2-nof0-40k-l12-hubert_o", {"useIndex": False}), ] elif mode == "testDDPNTorch": return [ "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_official_v1_v2.json", "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_ddpn_v1_v2.json", ], [ ("test-ddpn-v1-f0-48k-l9-hubert_t", {"useIndex": False}), ("test-ddpn-v1-nof0-48k-l9-hubert_t", {"useIndex": False}), ("test-ddpn-v2-f0-40k-l12-hubert_t", {"useIndex": False}), ("test-ddpn-v2-nof0-40k-l12-hubert_t", {"useIndex": False}), ("test-ddpn-v2-f0-40k-l12-hubert_jp_t", {"useIndex": False}), ("test-ddpn-v2-nof0-40k-l12-hubert_jp_t", {"useIndex": False}), ] elif mode == "testDDPNONNX": return [ "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_official_v1_v2.json", "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_ddpn_v1_v2.json", ], [ ("test-ddpn-v1-f0-48k-l9-hubert_o", {"useIndex": False}), ("test-ddpn-v1-nof0-48k-l9-hubert_o", {"useIndex": False}), ("test-ddpn-v2-f0-40k-l12-hubert_o", {"useIndex": False}), ("test-ddpn-v2-nof0-40k-l12-hubert_o", {"useIndex": False}), ("test-ddpn-v2-f0-40k-l12-hubert_jp_o", {"useIndex": False}), ("test-ddpn-v2-nof0-40k-l12-hubert_jp_o", {"useIndex": False}), ] elif mode == "testONNXFull": return [ "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_official_v1_v2.json", "https://huggingface.co/wok000/vcclient_model/raw/main/test/test_ddpn_v1_v2.json", ], [ ("test-official-v1-f0-48k-l9-hubert_o_full", {"useIndex": False}), ("test-official-v1-nof0-48k-l9-hubert_o_full", {"useIndex": False}), ("test-official-v2-f0-40k-l12-hubert_o_full", {"useIndex": False}), ("test-official-v2-nof0-40k-l12-hubert_o_full", {"useIndex": False}), ("test-ddpn-v1-f0-48k-l9-hubert_o_full", {"useIndex": False}), ("test-ddpn-v1-nof0-48k-l9-hubert_o_full", {"useIndex": False}), ("test-ddpn-v2-f0-40k-l12-hubert_o_full", {"useIndex": False}), ("test-ddpn-v2-nof0-40k-l12-hubert_o_full", {"useIndex": False}), ("test-ddpn-v2-f0-40k-l12-hubert_jp_o_full", {"useIndex": False}), ("test-ddpn-v2-nof0-40k-l12-hubert_jp_o_full", {"useIndex": False}), ] else: return [], [] RVC_MODEL_DIRNAME = "rvc" MAX_SLOT_NUM = 200