2023-05-20 09:54:00 +03:00
|
|
|
import torch
|
2023-05-31 08:30:35 +03:00
|
|
|
from const import EnumInferenceTypes
|
2023-05-29 11:34:35 +03:00
|
|
|
from voice_changer.RVC.deviceManager.DeviceManager import DeviceManager
|
2023-05-20 09:54:00 +03:00
|
|
|
from voice_changer.RVC.inferencer.Inferencer import Inferencer
|
2023-06-23 16:34:09 +03:00
|
|
|
from .rvc_models.infer_pack.models import SynthesizerTrnMs768NSFsid
|
2023-05-20 09:54:00 +03:00
|
|
|
|
|
|
|
|
|
|
|
class RVCInferencerv2(Inferencer):
    """Inferencer that runs a PyTorch ``SynthesizerTrnMs768NSFsid`` model."""

    def loadModel(self, file: str, gpu: int) -> "RVCInferencerv2":
        """Load the checkpoint at *file* and place the model on the device for *gpu*.

        Args:
            file: Path to a checkpoint readable by ``torch.load``. The loaded
                object must provide ``"config"`` (positional constructor
                arguments for the synthesizer) and ``"weight"`` (a state dict).
            gpu: Device identifier handed to ``DeviceManager`` to resolve the
                target device and to decide whether half precision is used.

        Returns:
            This instance, so the call can be chained.
        """
        # NOTE(review): the meaning of the positional ``True`` is defined by
        # Inferencer.setProps, which is not visible here - confirm there.
        self.setProps(EnumInferenceTypes.pyTorchRVCv2, file, True, gpu)

        dev = DeviceManager.get_instance().getDevice(gpu)
        isHalf = DeviceManager.get_instance().halfPrecisionAvailable(gpu)

        # SECURITY: torch.load unpickles the file, which can execute arbitrary
        # code. Only load checkpoints that come from a trusted source.
        # Deserialize onto the CPU first; the model is moved to `dev` below.
        cpt = torch.load(file, map_location="cpu")
        model = SynthesizerTrnMs768NSFsid(*cpt["config"], is_half=isHalf)

        model.eval()
        # strict=False: a key mismatch between checkpoint and model is tolerated
        # instead of raising.
        model.load_state_dict(cpt["weight"], strict=False)

        model = model.to(dev)
        if isHalf:
            model = model.half()

        self.model = model
        return self

    def infer(
        self,
        feats: torch.Tensor,
        pitch_length: torch.Tensor,
        pitch: torch.Tensor,
        pitchf: torch.Tensor,
        sid: torch.Tensor,
        convert_length: int | None,
    ) -> torch.Tensor:
        """Run the loaded model and return its output as clipped float32 audio.

        All arguments are forwarded unchanged to ``self.model.infer``;
        *convert_length* is passed by keyword.

        Returns:
            A float32 tensor with every value limited to ``[-1.0, 1.0]``.
        """
        # Inference only: do not record an autograd graph for the forward pass.
        # This is a no-op when the caller has already disabled gradients.
        with torch.no_grad():
            res = self.model.infer(feats, pitch_length, pitch, pitchf, sid, convert_length=convert_length)
            # Take the first returned item and index [0, 0] into it
            # (presumably batch 0 / channel 0 - TODO confirm against the model).
            res = res[0][0, 0].to(dtype=torch.float32)
            res = torch.clip(res, -1.0, 1.0)
        return res
|
|
|
|
|