voice-changer/server/voice_changer/utils/VoiceChangerModel.py

from typing import Any, Protocol, TypeAlias
import numpy as np
from const import VoiceChangerType

from voice_changer.utils.LoadModelParams import LoadModelParams


# Audio buffer alias: a NumPy array whose elements are 16-bit signed integers.
AudioInOut: TypeAlias = np.ndarray[Any, np.dtype[np.int16]]
# Audio buffer alias: a NumPy array whose elements are 32-bit floats.
AudioInOutFloat: TypeAlias = np.ndarray[Any, np.dtype[np.float32]]

# NOTE(review): both aliases below are declared with an int16 dtype, exactly
# like AudioInOut. Pitch and feature arrays are presumably floating-point --
# confirm against the code that produces them before relying on these hints.
PitchfInOut: TypeAlias = np.ndarray[Any, np.dtype[np.int16]]
FeatureInOut: TypeAlias = np.ndarray[Any, np.dtype[np.int16]]


class VoiceChangerModel(Protocol):
    """Structural interface describing a voice-changer model backend.

    Every method declared here is a stub without behaviour of its own;
    classes that match this protocol supply the actual implementations.
    """

    # Tag naming the kind of voice changer; the declared default is "RVC".
    voiceChangerType: VoiceChangerType = "RVC"

    def loadModel(self, params: LoadModelParams):
        """Load a model as described by ``params``.

        No return type is declared on this stub.
        """

    def get_processing_sampling_rate(self) -> int:
        """Return the processing sampling rate as an ``int``.

        NOTE(review): the unit is presumably Hz -- confirm with implementers.
        """

    def get_info(self) -> dict[str, Any]:
        """Return a string-keyed dictionary of information about the model."""

    def inference(self, data: tuple[Any, ...]) -> Any:
        """Run inference on ``data`` and return the result.

        NOTE(review): ``data`` is presumably the tuple produced by
        ``generate_input`` -- confirm against the calling code.
        """

    def generate_input(
        self, newData: AudioInOut, inputSize: int, crossfadeSize: int, solaSearchFrame: int
    ) -> tuple[Any, ...]:
        """Build and return an input tuple from the newly received audio.

        Args:
            newData: Newly received audio, typed as an int16 NumPy array.
            inputSize: Integer size of the input.
            crossfadeSize: Integer size of the crossfade.
            solaSearchFrame: Integer SOLA search frame value.

        NOTE(review): the units of the three size arguments (samples vs.
        frames) are not visible from this interface -- confirm with callers.
        """

    def update_settings(self, key: str, val: int | float | str) -> bool:
        """Update the setting named ``key`` with ``val`` and return a ``bool``.

        NOTE(review): the returned flag presumably reports whether ``key``
        was recognised and applied -- confirm with implementers.
        """
WIP: refactoring 2023-04-28 00:39:51 +03:00			`from typing import Any, Protocol, TypeAlias`
refactor: cherry pick from https://github.com/w-okada/voice-changer/pull/158. Timer and VoiceChangerModel 2023-04-12 19:13:25 +03:00			`import numpy as np`
bugfix: beatrice load 2023-11-08 13:54:13 +03:00			`from const import VoiceChangerType`
refactor: cherry pick from https://github.com/w-okada/voice-changer/pull/158. Timer and VoiceChangerModel 2023-04-12 19:13:25 +03:00
WIP: refactoring 2023-04-28 00:39:51 +03:00			`from voice_changer.utils.LoadModelParams import LoadModelParams`

refactor: cherry pick from https://github.com/w-okada/voice-changer/pull/158. Timer and VoiceChangerModel 2023-04-12 19:13:25 +03:00
			`AudioInOut: TypeAlias = np.ndarray[Any, np.dtype[np.int16]]`
Experimental LLVC 2023-11-12 17:10:58 +03:00			`AudioInOutFloat: TypeAlias = np.ndarray[Any, np.dtype[np.float32]]`

inferenceの高品質化+高速化 2023-07-01 10:45:25 +03:00			`PitchfInOut: TypeAlias = np.ndarray[Any, np.dtype[np.int16]]`
			`FeatureInOut: TypeAlias = np.ndarray[Any, np.dtype[np.int16]]`

refactor: cherry pick from https://github.com/w-okada/voice-changer/pull/158. Timer and VoiceChangerModel 2023-04-12 19:13:25 +03:00
			`class VoiceChangerModel(Protocol):`
bugfix: beatrice load 2023-11-08 13:54:13 +03:00			`voiceChangerType: VoiceChangerType = "RVC"`

WIP: refactoring 2023-04-28 00:39:51 +03:00			`# loadModel: Callable[..., dict[str, Any]]`
			`def loadModel(self, params: LoadModelParams):`
			`...`

			`def get_processing_sampling_rate(self) -> int:`
			`...`

			`def get_info(self) -> dict[str, Any]:`
			`...`

			`def inference(self, data: tuple[Any, ...]) -> Any:`
			`...`

bugfix: beatrice load 2023-11-08 13:54:13 +03:00			`def generate_input(`
			`self,`
			`newData: AudioInOut,`
			`inputSize: int,`
			`crossfadeSize: int,`
			`solaSearchFrame: int,`
			`) -> tuple[Any, ...]:`
WIP: refactoring 2023-04-28 00:39:51 +03:00			`...`

wip:support m1 mac 1 2023-06-21 03:18:51 +03:00			`def update_settings(self, key: str, val: int | float | str) -> bool:`
WIP: refactoring 2023-04-28 00:39:51 +03:00			`...`