mirror of
https://github.com/w-okada/voice-changer.git
synced 2025-03-15 04:13:57 +03:00
WIP: so-vits-svc 40v2, alpha (refactoring4 apply for v13)
This commit is contained in:
parent
5818292046
commit
ef6fdd8d49
4
client/demo_v13/dist/index.js
vendored
4
client/demo_v13/dist/index.js
vendored
File diff suppressed because one or more lines are too long
@ -28,7 +28,7 @@ const App = () => {
|
|||||||
return (
|
return (
|
||||||
<div className="top-title">
|
<div className="top-title">
|
||||||
<span className="title">Voice Changer Setting</span>
|
<span className="title">Voice Changer Setting</span>
|
||||||
<span className="top-title-version">for v.1.3.x</span>
|
<span className="top-title-version">for MMVC v.1.3.x</span>
|
||||||
<span className="belongings">
|
<span className="belongings">
|
||||||
<a className="link" href="https://github.com/w-okada/voice-changer" target="_blank" rel="noopener noreferrer">
|
<a className="link" href="https://github.com/w-okada/voice-changer" target="_blank" rel="noopener noreferrer">
|
||||||
<img src="./assets/icons/github.svg" />
|
<img src="./assets/icons/github.svg" />
|
||||||
|
@ -118,6 +118,9 @@ class MMVCv13:
|
|||||||
|
|
||||||
return data
|
return data
|
||||||
|
|
||||||
|
def get_processing_sampling_rate(self):
|
||||||
|
return self.hps.data.sampling_rate
|
||||||
|
|
||||||
def _get_spec(self, audio: any):
|
def _get_spec(self, audio: any):
|
||||||
spec = spectrogram_torch(audio, self.hps.data.filter_length,
|
spec = spectrogram_torch(audio, self.hps.data.filter_length,
|
||||||
self.hps.data.sampling_rate, self.hps.data.hop_length, self.hps.data.win_length,
|
self.hps.data.sampling_rate, self.hps.data.hop_length, self.hps.data.win_length,
|
||||||
@ -125,19 +128,24 @@ class MMVCv13:
|
|||||||
spec = torch.squeeze(spec, 0)
|
spec = torch.squeeze(spec, 0)
|
||||||
return spec
|
return spec
|
||||||
|
|
||||||
def generate_input(self, newData: any, convertSize: int):
|
def generate_input(self, newData: any, inputSize: int, crossfadeSize: int):
|
||||||
newData = newData.astype(np.float32)
|
newData = newData.astype(np.float32) / self.hps.data.max_wav_value
|
||||||
|
|
||||||
if hasattr(self, "audio_buffer"):
|
if hasattr(self, "audio_buffer"):
|
||||||
self.audio_buffer = np.concatenate([self.audio_buffer, newData], 0) # 過去のデータに連結
|
self.audio_buffer = np.concatenate([self.audio_buffer, newData], 0) # 過去のデータに連結
|
||||||
else:
|
else:
|
||||||
self.audio_buffer = newData
|
self.audio_buffer = newData
|
||||||
|
|
||||||
self.audio_buffer = self.audio_buffer[-(convertSize):] # 変換対象の部分だけ抽出
|
convertSize = inputSize + crossfadeSize
|
||||||
|
if convertSize < 8192:
|
||||||
|
convertSize = 8192
|
||||||
|
if convertSize % self.hps.data.hop_length != 0: # モデルの出力のホップサイズで切り捨てが発生するので補う。
|
||||||
|
convertSize = convertSize + (self.hps.data.hop_length - (convertSize % self.hps.data.hop_length))
|
||||||
|
|
||||||
|
self.audio_buffer = self.audio_buffer[-1 * convertSize:] # 変換対象の部分だけ抽出
|
||||||
|
|
||||||
audio = torch.FloatTensor(self.audio_buffer)
|
audio = torch.FloatTensor(self.audio_buffer)
|
||||||
audio_norm = audio / self.hps.data.max_wav_value # normalize
|
audio_norm = audio.unsqueeze(0) # unsqueeze
|
||||||
audio_norm = audio_norm.unsqueeze(0) # unsqueeze
|
|
||||||
spec = self._get_spec(audio_norm)
|
spec = self._get_spec(audio_norm)
|
||||||
sid = torch.LongTensor([int(self.settings.srcId)])
|
sid = torch.LongTensor([int(self.settings.srcId)])
|
||||||
|
|
||||||
|
@ -149,9 +149,7 @@ class MMVCv15:
|
|||||||
|
|
||||||
def _get_spec(self, newData: any):
|
def _get_spec(self, newData: any):
|
||||||
audio = torch.FloatTensor(newData)
|
audio = torch.FloatTensor(newData)
|
||||||
# audio_norm = audio / self.hps.data.max_wav_value # normalize
|
audio_norm = audio.unsqueeze(0) # unsqueeze
|
||||||
audio_norm = audio
|
|
||||||
audio_norm = audio_norm.unsqueeze(0) # unsqueeze
|
|
||||||
spec = spectrogram_torch(audio_norm, self.hps.data.filter_length,
|
spec = spectrogram_torch(audio_norm, self.hps.data.filter_length,
|
||||||
self.hps.data.sampling_rate, self.hps.data.hop_length, self.hps.data.win_length,
|
self.hps.data.sampling_rate, self.hps.data.hop_length, self.hps.data.win_length,
|
||||||
center=False)
|
center=False)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user