voice-changer/demo/MMVCServerSIO.py

517 lines
18 KiB
Python
Raw Normal View History

2022-11-12 04:27:34 +03:00
import sys, os, struct, argparse, logging, shutil, base64, traceback
2022-11-12 03:26:28 +03:00
from dataclasses import dataclass
2022-11-12 04:27:34 +03:00
from datetime import datetime
from distutils.util import strtobool
import numpy as np
from scipy.io.wavfile import write, read
2022-12-09 06:52:27 +03:00
sys.path.append("MMVC_Trainer")
sys.path.append("MMVC_Trainer/text")
2022-10-29 18:58:21 +03:00
2022-11-12 04:27:34 +03:00
from fastapi.routing import APIRoute
from fastapi import HTTPException, Request, Response, FastAPI, UploadFile, File, Form
2022-10-30 13:28:27 +03:00
from fastapi.staticfiles import StaticFiles
2022-11-12 04:27:34 +03:00
from fastapi.encoders import jsonable_encoder
from fastapi.responses import JSONResponse
from fastapi.middleware.cors import CORSMiddleware
import uvicorn
2022-10-29 18:58:21 +03:00
import socketio
2022-11-12 04:27:34 +03:00
from pydantic import BaseModel
2022-10-29 18:58:21 +03:00
2022-11-12 04:27:34 +03:00
from typing import Callable
2022-11-08 13:00:47 +03:00
2022-11-12 04:27:34 +03:00
from mods.Trainer_Speakers import mod_get_speakers
from mods.Trainer_Training import mod_post_pre_training, mod_post_start_training, mod_post_stop_training, mod_get_related_files, mod_get_tail_training_log
from mods.Trainer_Model import mod_get_model, mod_delete_model
from mods.Trainer_Models import mod_get_models
from mods.Trainer_MultiSpeakerSetting import mod_get_multi_speaker_setting, mod_post_multi_speaker_setting
from mods.Trainer_Speaker_Voice import mod_get_speaker_voice
from mods.Trainer_Speaker_Voices import mod_get_speaker_voices
from mods.Trainer_Speaker import mod_delete_speaker
from mods.FileUploader import upload_file, concat_file_chunks
2022-10-29 18:58:21 +03:00
from mods.VoiceChanger import VoiceChanger
2022-11-12 04:27:34 +03:00
from mods.ssl import create_self_signed_cert
2022-11-08 13:00:47 +03:00
# File Uploader
2022-11-12 04:27:34 +03:00
# Trainer Rest Internal
2022-10-29 18:58:21 +03:00
class UvicornSuppressFilter(logging.Filter):
    """Logging filter that rejects every record it is asked about."""

    def filter(self, record) -> bool:
        # Returning False tells the logging machinery to drop the record.
        return False
2022-11-12 04:27:34 +03:00
2022-10-29 18:58:21 +03:00
# Drop everything emitted on uvicorn's error logger.
logging.getLogger("uvicorn.error").addFilter(UvicornSuppressFilter())

# Keep the multipart parser's records from propagating to ancestor loggers.
# `logger` ends up bound to this logger.
logger = logging.getLogger("multipart.multipart")
logger.propagate = False
2022-11-12 04:27:34 +03:00
2022-11-12 03:26:28 +03:00
@dataclass
class ExApplicationInfo:
    """Information about externally reachable companion applications."""

    # Externally visible TensorBoard port; the module-level instance starts at 0.
    external_tensorboard_port: int


# Shared module-level instance, created with a port of 0.
exApplitionInfo = ExApplicationInfo(0)
2022-11-12 04:27:34 +03:00
2022-10-29 18:58:21 +03:00
class VoiceModel(BaseModel):
    # Request body of the POST /test endpoint.
    # The first five fields are forwarded unchanged to the voice changer.
    gpu: int
    srcId: int
    dstId: int
    timestamp: int
    prefixChunkSize: int
    # Base64 text; the endpoint decodes it and reads it as little-endian int16 samples.
    buffer: str
2022-11-12 04:27:34 +03:00
class MyCustomNamespace(socketio.AsyncNamespace):
    """Socket.IO namespace that runs incoming audio chunks through a VoiceChanger.

    A VoiceChanger is attached lazily by ``loadModel``; until then
    ``changeVoice`` returns a single zero sample.
    """

    def __init__(self, namespace):
        super().__init__(namespace)

    def loadModel(self, config, model):
        """Create a VoiceChanger from *config* and *model*, replacing any previous one."""
        if hasattr(self, 'voiceChanger'):
            # Release the previously loaded changer before swapping it out.
            self.voiceChanger.destroy()
        self.voiceChanger = VoiceChanger(config, model)

    def changeVoice(self, gpu, srcId, dstId, timestamp, prefixChunkSize, unpackedData):
        """Forward one chunk to the loaded VoiceChanger and return its result.

        When no model has been loaded yet, a message is printed and a
        one-element int16 array of zeros is returned instead.
        """
        if hasattr(self, 'voiceChanger'):
            return self.voiceChanger.on_request(
                gpu, srcId, dstId, timestamp, prefixChunkSize, unpackedData)
        print("Voice Change is not loaded. Did you load a correct model?")
        return np.zeros(1).astype(np.int16)

    def on_connect(self, sid, environ):
        """Connection hook; nothing to do."""
        pass

    async def on_request_message(self, sid, msg):
        """Handle a ``request_message`` event and answer with a ``response`` event.

        *msg* is indexed positionally: gpu, srcId, dstId, timestamp,
        prefixChunkSize, and a bytes payload that is read as little-endian
        int16 samples.
        """
        gpu = int(msg[0])
        srcId = int(msg[1])
        dstId = int(msg[2])
        timestamp = int(msg[3])
        prefixChunkSize = int(msg[4])
        data = msg[5]

        sample_count = len(data) // struct.calcsize('<h')
        unpackedData = np.array(struct.unpack('<%sh' % sample_count, data))
        audio1 = self.changeVoice(
            gpu, srcId, dstId, timestamp, prefixChunkSize, unpackedData)

        payload = struct.pack('<%sh' % len(audio1), *audio1)
        # Address only the requesting client. Without a recipient the event is
        # broadcast to every client connected to this namespace.
        await self.emit('response', [timestamp, payload], room=sid)

    def on_disconnect(self, sid):
        """Disconnection hook; nothing to do."""
        pass
2022-10-29 18:58:21 +03:00
def _parse_bool_flag(value):
    """Convert a truthy/falsy word to 1 or 0.

    Accepts the same spellings as ``distutils.util.strtobool`` and returns the
    same integers, so this function no longer relies on the deprecated
    distutils helper (removed from the standard library in Python 3.12).

    Raises:
        ValueError: if *value* is not a recognised spelling; argparse turns
            this into a usage error.
    """
    normalized = value.lower()
    if normalized in ("y", "yes", "t", "true", "on", "1"):
        return 1
    if normalized in ("n", "no", "f", "false", "off", "0"):
        return 0
    raise ValueError("invalid truth value %r" % (value,))


def setupArgParser():
    """Build the command-line parser for the server.

    Returns:
        argparse.ArgumentParser with the options -t, -p, -c, -m, --https,
        --httpsKey, --httpsCert, --httpsSelfSigned and --colab.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("-t", type=str, default="MMVC",
                        help="Server type. MMVC|TRAIN")
    parser.add_argument("-p", type=int, default=8080, help="port")
    parser.add_argument("-c", type=str, help="path for the config.json")
    parser.add_argument("-m", type=str, help="path for the model file")
    parser.add_argument("--https", type=_parse_bool_flag,
                        default=False, help="use https")
    parser.add_argument("--httpsKey", type=str,
                        default="ssl.key", help="path for the key of https")
    parser.add_argument("--httpsCert", type=str,
                        default="ssl.cert", help="path for the cert of https")
    parser.add_argument("--httpsSelfSigned", type=_parse_bool_flag,
                        default=True, help="generate self-signed certificate")
    parser.add_argument("--colab", type=_parse_bool_flag,
                        default=False, help="run on colab")
    return parser
2022-11-12 04:27:34 +03:00
2022-10-29 18:58:21 +03:00
def printMessage(message, level=0):
    """Print *message* wrapped in an ANSI escape sequence chosen by *level*.

    Levels 0, 1 and 2 each have their own sequence; any other level uses a
    fourth one. Every level except 0 puts a space before the message.
    """
    if level == 0:
        prefix = "\033[17m"
    elif level == 1:
        prefix = "\033[34m "
    elif level == 2:
        prefix = "\033[32m "
    else:
        prefix = "\033[47m "
    # "\033[0m" resets the terminal attributes after the message.
    print(f"{prefix}{message}\033[0m")
2022-11-12 04:27:34 +03:00
2022-10-29 18:58:21 +03:00
# A `global` statement at module scope has no effect; it only names the two
# ASGI application objects this module is expected to expose.
global app_socketio, app_fastapi

# The command line is parsed at import time, so every (re-)import of this
# module sees the same options.
parser = setupArgParser()
args = parser.parse_args()

printMessage(f"Phase name:{__name__}", level=2)
# File name of this script with its last three characters (".py") removed.
thisFilename = os.path.basename(__file__)[:-3]
2022-11-12 04:27:34 +03:00
2022-11-08 13:00:47 +03:00
class ValidationErrorLoggingRoute(APIRoute):
    """APIRoute that logs failing requests and reports validation errors as 422."""

    def get_route_handler(self) -> Callable:
        """Wrap the default route handler with logging and error translation.

        Request validation failures are printed and re-raised as an
        HTTPException(422) whose detail holds the validation errors and the
        decoded request body. Every other exception is printed and re-raised
        unchanged.
        """
        # Local import keeps this block self-contained; fastapi is already a
        # dependency of this file.
        from fastapi.exceptions import RequestValidationError

        original_route_handler = super().get_route_handler()

        async def custom_route_handler(request: Request) -> Response:
            try:
                return await original_route_handler(request)
            except RequestValidationError as exc:
                print("Exception", request.url, str(exc))
                body = await request.body()
                detail = {"errors": exc.errors(), "body": body.decode()}
                raise HTTPException(status_code=422, detail=detail) from exc
            except Exception as exc:
                # Only RequestValidationError provides .errors(); calling it on
                # any other exception would hide the real failure behind an
                # AttributeError.
                print("Exception", request.url, str(exc))
                raise

        return custom_route_handler
2022-10-29 18:58:21 +03:00
2022-11-12 04:27:34 +03:00
2022-10-30 13:28:27 +03:00
# Build the ASGI applications and register every HTTP route. This runs when the
# module is imported under its own file name or when Colab mode is enabled.
if __name__ == thisFilename or args.colab:
    printMessage(f"PHASE3:{__name__}", level=2)
    TYPE = args.t
    PORT = args.p
    CONFIG = args.c
    MODEL = args.m

    if os.getenv("EX_TB_PORT"):
        EX_TB_PORT = os.environ["EX_TB_PORT"]
        exApplitionInfo.external_tensorboard_port = int(EX_TB_PORT)

    app_fastapi = FastAPI()
    app_fastapi.router.route_class = ValidationErrorLoggingRoute
    app_fastapi.add_middleware(
        CORSMiddleware,
        allow_origins=["*"],
        allow_credentials=True,
        allow_methods=["*"],
        allow_headers=["*"],
    )

    # The same frontend bundle is served under three URL prefixes.
    app_fastapi.mount(
        "/front", StaticFiles(directory="../frontend/dist", html=True), name="static")
    app_fastapi.mount(
        "/trainer", StaticFiles(directory="../frontend/dist", html=True), name="static")
    app_fastapi.mount(
        "/recorder", StaticFiles(directory="../frontend/dist", html=True), name="static")

    sio = socketio.AsyncServer(
        async_mode='asgi',
        cors_allowed_origins='*'
    )
    namespace = MyCustomNamespace('/test')
    sio.register_namespace(namespace)
    # Load a model at start-up only when both paths were given on the command line.
    if CONFIG and MODEL:
        namespace.loadModel(CONFIG, MODEL)

    # Socket.IO handles its own traffic and passes everything else to FastAPI.
    app_socketio = socketio.ASGIApp(
        sio,
        other_asgi_app=app_fastapi,
        static_files={
            '/assets/icons/github.svg': {
                'filename': '../frontend/dist/assets/icons/github.svg',
                'content_type': 'image/svg+xml'
            },
            '': '../frontend/dist',
            '/': '../frontend/dist/index.html',
        }
    )

    @app_fastapi.get("/api/hello")
    async def index():
        """Fixed-payload hello endpoint."""
        return {"result": "Index"}

    ############
    # File Uploader
    ############
    UPLOAD_DIR = "upload_dir"
    os.makedirs(UPLOAD_DIR, exist_ok=True)
    MODEL_DIR = "MMVC_Trainer/logs"
    os.makedirs(MODEL_DIR, exist_ok=True)

    @app_fastapi.post("/upload_file")
    async def post_upload_file(
        file: UploadFile = File(...),
        filename: str = Form(...)
    ):
        """Store one uploaded file (or file chunk) in UPLOAD_DIR."""
        return upload_file(UPLOAD_DIR, file, filename)

    @app_fastapi.post("/load_model")
    async def post_load_model(
        modelFilename: str = Form(...),
        modelFilenameChunkNum: int = Form(...),
        configFilename: str = Form(...)
    ):
        """Join the uploaded model chunks and load the model into the voice changer."""
        modelFilePath = concat_file_chunks(
            UPLOAD_DIR, modelFilename, modelFilenameChunkNum, UPLOAD_DIR)
        print(f'File saved to: {modelFilePath}')
        # NOTE(review): configFilename comes straight from the client and is
        # joined into a path unchecked — confirm it is sanitised upstream.
        configFilePath = os.path.join(UPLOAD_DIR, configFilename)

        namespace.loadModel(configFilePath, modelFilePath)
        return {"load": f"{modelFilePath}, {configFilePath}"}

    @app_fastapi.post("/load_model_for_train")
    async def post_load_model_for_train(
        modelGFilename: str = Form(...),
        modelGFilenameChunkNum: int = Form(...),
        modelDFilename: str = Form(...),
        modelDFilenameChunkNum: int = Form(...),
    ):
        """Join the uploaded G and D model chunks into MODEL_DIR."""
        modelGFilePath = concat_file_chunks(
            UPLOAD_DIR, modelGFilename, modelGFilenameChunkNum, MODEL_DIR)
        modelDFilePath = concat_file_chunks(
            UPLOAD_DIR, modelDFilename, modelDFilenameChunkNum, MODEL_DIR)
        return {"File saved": f"{modelGFilePath}, {modelDFilePath}"}

    # Previously named post_load_model, which re-defined the /load_model
    # handler's name; the route path is unchanged.
    @app_fastapi.post("/extract_voices")
    async def post_extract_voices(
        zipFilename: str = Form(...),
        zipFileChunkNum: int = Form(...),
    ):
        """Join the uploaded archive chunks and unpack them into the dataset directory."""
        zipFilePath = concat_file_chunks(
            UPLOAD_DIR, zipFilename, zipFileChunkNum, UPLOAD_DIR)
        # SECURITY NOTE(review): the archive is client-supplied and is unpacked
        # without checking member paths; a crafted archive could write outside
        # the target directory. Validate members before exposing this endpoint
        # to untrusted clients.
        shutil.unpack_archive(zipFilePath, "MMVC_Trainer/dataset/textful/")
        return {"Zip file unpacked": f"{zipFilePath}"}

    ############
    # Voice Changer
    ############
    @app_fastapi.post("/test")
    async def post_test(voice: VoiceModel):
        """Convert one base64-encoded chunk of little-endian int16 audio.

        Returns a JSON response echoing the request parameters plus the
        converted audio as base64. On any failure the error is printed and
        its message is returned as a plain string.
        """
        try:
            gpu = voice.gpu
            srcId = voice.srcId
            dstId = voice.dstId
            timestamp = voice.timestamp
            prefixChunkSize = voice.prefixChunkSize
            buffer = voice.buffer
            wav = base64.b64decode(buffer)

            # `wav` is bytes, so the former `wav == 0` test could never be
            # true; an empty payload is what selects the dummy input.
            if len(wav) == 0:
                _, unpackedData = read("dummy.wav")
            else:
                unpackedData = np.array(struct.unpack(
                    '<%sh' % (len(wav) // struct.calcsize('<h')), wav))
                # Keep a copy of the received audio for debugging; make sure
                # the target directory exists first.
                os.makedirs("logs", exist_ok=True)
                write("logs/received_data.wav", 24000,
                      unpackedData.astype(np.int16))

            changedVoice = namespace.changeVoice(
                gpu, srcId, dstId, timestamp, prefixChunkSize, unpackedData)

            changedVoiceBase64 = base64.b64encode(changedVoice).decode('utf-8')
            data = {
                "gpu": gpu,
                "srcId": srcId,
                "dstId": dstId,
                "timestamp": timestamp,
                "prefixChunkSize": prefixChunkSize,
                "changedVoiceBase64": changedVoiceBase64
            }
            json_compatible_item_data = jsonable_encoder(data)
            return JSONResponse(content=json_compatible_item_data)

        except Exception as e:
            print("REQUEST PROCESSING!!!! EXCEPTION!!!", e)
            print(traceback.format_exc())
            return str(e)

    # Trainer REST API. NOTE: Colab apparently can only POST to paths directly
    # under the top level, so these endpoints are only "REST-like".

    @app_fastapi.get("/get_speakers")
    async def get_speakers():
        return mod_get_speakers()

    @app_fastapi.delete("/delete_speaker")
    async def delete_speaker(speaker: str = Form(...)):
        return mod_delete_speaker(speaker)

    @app_fastapi.get("/get_speaker_voices")
    async def get_speaker_voices(speaker: str):
        return mod_get_speaker_voices(speaker)

    # Previously named get_speaker_voices, duplicating the handler above; the
    # route path is unchanged.
    @app_fastapi.get("/get_speaker_voice")
    async def get_speaker_voice(speaker: str, voice: str):
        return mod_get_speaker_voice(speaker, voice)

    @app_fastapi.get("/get_multi_speaker_setting")
    async def get_multi_speaker_setting():
        return mod_get_multi_speaker_setting()

    @app_fastapi.post("/post_multi_speaker_setting")
    async def post_multi_speaker_setting(setting: str = Form(...)):
        return mod_post_multi_speaker_setting(setting)

    @app_fastapi.get("/get_models")
    async def get_models():
        return mod_get_models()

    @app_fastapi.get("/get_model")
    async def get_model(model: str):
        return mod_get_model(model)

    @app_fastapi.delete("/delete_model")
    async def delete_model(model: str = Form(...)):
        return mod_delete_model(model)

    @app_fastapi.post("/post_pre_training")
    async def post_pre_training(batch: int = Form(...)):
        return mod_post_pre_training(batch)

    @app_fastapi.post("/post_start_training")
    async def post_start_training():
        print("POST START TRAINING..")
        return mod_post_start_training()

    @app_fastapi.post("/post_stop_training")
    async def post_stop_training():
        print("POST STOP TRAINING..")
        return mod_post_stop_training()

    @app_fastapi.get("/get_related_files")
    async def get_related_files():
        return mod_get_related_files()

    @app_fastapi.get("/get_tail_training_log")
    async def get_tail_training_log(num: int):
        return mod_get_tail_training_log(num)

    @app_fastapi.get("/get_ex_application_info")
    async def get_ex_application_info():
        """Return the shared ExApplicationInfo instance as JSON."""
        json_compatible_item_data = jsonable_encoder(exApplitionInfo)
        return JSONResponse(content=json_compatible_item_data)
2022-10-29 18:58:21 +03:00
if __name__ == '__mp_main__':
    printMessage(f"PHASE2:{__name__}", level=2)

# Script entry point: validate options, print connection hints, then start uvicorn.
if __name__ == '__main__':
    printMessage(f"PHASE1:{__name__}", level=2)
    TYPE = args.t
    PORT = args.p
    CONFIG = args.c
    MODEL = args.m

    if TYPE != "MMVC" and TYPE != "TRAIN":
        print("Type(-t) should be MMVC or TRAIN")
        sys.exit(1)

    printMessage("Start MMVC SocketIO Server", level=0)
    printMessage(f"CONFIG:{CONFIG}, MODEL:{MODEL}", level=1)

    # NOTE(review): the indentation of this section was reconstructed; confirm
    # that everything up to the server start belongs to the non-Colab branch.
    if not args.colab:
        # Read the optional variables once. They were previously assigned only
        # when set but read unconditionally further down, which raised
        # NameError whenever EX_PORT or EX_IP was missing.
        EX_PORT = os.getenv("EX_PORT")
        EX_TB_PORT = os.getenv("EX_TB_PORT")
        EX_IP = os.getenv("EX_IP")

        if EX_PORT:
            printMessage(
                f"External_Port:{EX_PORT} Internal_Port:{PORT}", level=1)
        else:
            printMessage(f"Internal_Port:{PORT}", level=1)

        if EX_TB_PORT:
            printMessage(f"External_TeonsorBord_Port:{EX_TB_PORT}", level=1)

        if EX_IP:
            printMessage(f"External_IP:{EX_IP}", level=1)

        # Prepare the HTTPS key/certificate.
        if args.https and args.httpsSelfSigned:
            # HTTPS with a freshly generated self-signed certificate.
            os.makedirs("./key", exist_ok=True)
            key_base_name = f"{datetime.now().strftime('%Y%m%d_%H%M%S')}"
            keyname = f"{key_base_name}.key"
            certname = f"{key_base_name}.cert"
            create_self_signed_cert(certname, keyname, certargs={"Country": "JP",
                                                                 "State": "Tokyo",
                                                                 "City": "Chuo-ku",
                                                                 "Organization": "F",
                                                                 "Org. Unit": "F"}, cert_dir="./key")
            key_path = os.path.join("./key", keyname)
            cert_path = os.path.join("./key", certname)
            printMessage(
                f"protocol: HTTPS(self-signed), key:{key_path}, cert:{cert_path}", level=1)
        elif args.https:
            # HTTPS with the key/certificate given on the command line.
            key_path = args.httpsKey
            cert_path = args.httpsCert
            printMessage(
                f"protocol: HTTPS, key:{key_path}, cert:{cert_path}", level=1)
        else:
            # Plain HTTP.
            printMessage("protocol: HTTP", level=1)

        # Show the address to open.
        if args.https:
            printMessage(
                "open https://<IP>:<PORT>/ with your browser.", level=0)
        else:
            printMessage(
                "open http://<IP>:<PORT>/ with your browser.", level=0)

        path = "" if TYPE == "MMVC" else "trainer"

        if EX_PORT and EX_IP and args.https:
            printMessage("In many cases it is one of the following", level=1)
            printMessage(f"https://localhost:{EX_PORT}/{path}", level=1)
            # EX_IP may hold several space-separated addresses.
            for ip in EX_IP.strip().split(" "):
                printMessage(f"https://{ip}:{EX_PORT}/{path}", level=1)
        elif EX_PORT and EX_IP:
            printMessage("In many cases it is one of the following", level=1)
            printMessage(f"http://localhost:{EX_PORT}/{path}", level=1)

    # Start the server. uvicorn is given "<module>:<attribute>" so that it
    # imports this file under its module name.
    if args.https:
        # HTTPS server.
        uvicorn.run(
            f"{os.path.basename(__file__)[:-3]}:app_socketio",
            host="0.0.0.0",
            port=int(PORT),
            reload=True,
            ssl_keyfile=key_path,
            ssl_certfile=cert_path,
            log_level="critical"
        )
    else:
        # HTTP server.
        if args.colab:
            # Colab mode serves the FastAPI app directly and without reload.
            uvicorn.run(
                f"{os.path.basename(__file__)[:-3]}:app_fastapi",
                host="0.0.0.0",
                port=int(PORT),
                log_level="critical"
            )
        else:
            uvicorn.run(
                f"{os.path.basename(__file__)[:-3]}:app_socketio",
                host="0.0.0.0",
                port=int(PORT),
                reload=True,
                log_level="critical"
            )