voice-changer/client/lib/src/const.ts

628 lines
15 KiB
TypeScript
Raw Normal View History

2023-01-04 20:28:36 +03:00
// (★1) chunk sizeは 128サンプル, 256byte(int16)と定義。
// (★2) 256byte(最低バッファサイズ256から間引いた個数x2byte)をchunkとして管理。
2023-01-11 21:49:22 +03:00
// 24000sample -> 1sec, 128sample(1chunk) -> 5.333msec
2023-01-11 22:52:01 +03:00
// 187.5chunk -> 1sec
2023-01-04 20:28:36 +03:00
2023-03-09 00:47:11 +03:00
export const ClientType = {
"MMVCv15": "MMVCv15",
"MMVCv13": "MMVCv13",
2023-04-05 12:08:06 +03:00
"so-vits-svc-40": "so-vits-svc-40",
"so-vits-svc-40_c": "so-vits-svc-40_c",
2023-04-05 20:31:10 +03:00
"so-vits-svc-40v2": "so-vits-svc-40v2",
2023-04-16 15:34:00 +03:00
"DDSP-SVC": "DDSP-SVC",
2023-04-05 20:31:10 +03:00
"RVC": "RVC"
2023-03-15 02:56:17 +03:00
2023-03-09 00:47:11 +03:00
} as const
export type ClientType = typeof ClientType[keyof typeof ClientType]
///////////////////////
// サーバセッティング
///////////////////////
export const InputSampleRate = {
"48000": 48000,
2023-03-14 20:39:34 +03:00
"44100": 44100,
"24000": 24000
} as const
export type InputSampleRate = typeof InputSampleRate[keyof typeof InputSampleRate]
2023-04-07 22:39:04 +03:00
export const ModelSamplingRate = {
"48000": 48000,
"40000": 40000,
"32000": 32000
} as const
export type ModelSamplingRate = typeof InputSampleRate[keyof typeof InputSampleRate]
export const CrossFadeOverlapSize = {
"1024": 1024,
"2048": 2048,
"4096": 4096,
} as const
export type CrossFadeOverlapSize = typeof CrossFadeOverlapSize[keyof typeof CrossFadeOverlapSize]
2023-02-14 16:32:25 +03:00
export const OnnxExecutionProvider = {
"CPUExecutionProvider": "CPUExecutionProvider",
"CUDAExecutionProvider": "CUDAExecutionProvider",
"DmlExecutionProvider": "DmlExecutionProvider",
"OpenVINOExecutionProvider": "OpenVINOExecutionProvider",
} as const
export type OnnxExecutionProvider = typeof OnnxExecutionProvider[keyof typeof OnnxExecutionProvider]
export const Framework = {
"PyTorch": "PyTorch",
"ONNX": "ONNX",
} as const
export type Framework = typeof Framework[keyof typeof Framework]
export const F0Detector = {
"dio": "dio",
"harvest": "harvest",
2023-04-16 15:34:00 +03:00
"parselmouth": "parselmouth",
"crepe": "crepe",
} as const
export type F0Detector = typeof F0Detector[keyof typeof F0Detector]
2023-02-19 13:22:00 +03:00
export const ServerSettingKey = {
"srcId": "srcId",
"dstId": "dstId",
"gpu": "gpu",
2023-01-12 15:42:02 +03:00
"crossFadeOffsetRate": "crossFadeOffsetRate",
"crossFadeEndRate": "crossFadeEndRate",
"crossFadeOverlapSize": "crossFadeOverlapSize",
2023-04-14 03:18:34 +03:00
"solaEnabled": "solaEnabled",
"framework": "framework",
"onnxExecutionProvider": "onnxExecutionProvider",
"f0Factor": "f0Factor",
"f0Detector": "f0Detector",
"recordIO": "recordIO",
2023-03-11 02:21:16 +03:00
"tran": "tran",
"noiceScale": "noiceScale",
"predictF0": "predictF0",
"silentThreshold": "silentThreshold",
"extraConvertSize": "extraConvertSize",
"clusterInferRatio": "clusterInferRatio",
2023-03-11 02:21:16 +03:00
2023-04-07 21:11:37 +03:00
"indexRatio": "indexRatio",
2023-04-07 22:39:04 +03:00
"rvcQuality": "rvcQuality",
"modelSamplingRate": "modelSamplingRate",
2023-04-16 15:34:00 +03:00
"enableEnhancer": "enableEnhancer",
"enhancerTune": "enhancerTune",
2023-04-07 21:11:37 +03:00
"inputSampleRate": "inputSampleRate",
} as const
export type ServerSettingKey = typeof ServerSettingKey[keyof typeof ServerSettingKey]
export type VoiceChangerServerSetting = {
2023-01-04 20:28:36 +03:00
srcId: number,
dstId: number,
gpu: number,
crossFadeOffsetRate: number,
crossFadeEndRate: number,
crossFadeOverlapSize: CrossFadeOverlapSize,
2023-04-14 03:18:34 +03:00
solaEnabled: number,
2023-01-07 14:07:39 +03:00
2023-01-12 10:38:45 +03:00
framework: Framework
onnxExecutionProvider: OnnxExecutionProvider,
2023-02-10 18:59:44 +03:00
f0Factor: number
f0Detector: F0Detector // dio or harvest
2023-02-14 23:02:51 +03:00
recordIO: number // 0:off, 1:on
2023-03-11 02:21:16 +03:00
tran: number // so-vits-svc
noiceScale: number // so-vits-svc
predictF0: number // so-vits-svc
silentThreshold: number // so-vits-svc
extraConvertSize: number// so-vits-svc
clusterInferRatio: number // so-vits-svc
2023-03-11 02:21:16 +03:00
2023-04-07 21:11:37 +03:00
indexRatio: number // RVC
2023-04-07 22:39:04 +03:00
rvcQuality: number // 0:low, 1:high
modelSamplingRate: ModelSamplingRate // 32000,40000,48000
2023-04-07 21:11:37 +03:00
2023-04-16 15:34:00 +03:00
enableEnhancer: number // DDSP-SVC
enhancerTune: number // DDSP-SVC
2023-02-18 14:53:15 +03:00
inputSampleRate: InputSampleRate
2023-01-04 20:28:36 +03:00
}
export type ServerInfo = VoiceChangerServerSetting & {
status: string
configFile: string,
pyTorchModelFile: string,
onnxModelFile: string,
onnxExecutionProviders: OnnxExecutionProvider[]
}
export type ServerInfoSoVitsSVC = ServerInfo & {
speakers: { [key: string]: number }
}
2023-03-09 00:55:57 +03:00
export const DefaultServerSetting_MMVCv15: ServerInfo = {
srcId: 0,
dstId: 101,
gpu: 0,
2023-02-20 22:07:43 +03:00
crossFadeOffsetRate: 0.0,
crossFadeEndRate: 1.0,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
2023-04-14 03:18:34 +03:00
solaEnabled: 0,
framework: Framework.PyTorch,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
2023-03-09 00:55:57 +03:00
f0Detector: F0Detector.dio,
recordIO: 0,
2023-03-11 02:21:16 +03:00
tran: 0,
noiceScale: 0,
predictF0: 0,
silentThreshold: 0,
extraConvertSize: 0,
clusterInferRatio: 0,
2023-03-11 02:21:16 +03:00
2023-04-07 21:11:37 +03:00
indexRatio: 0,
2023-04-07 22:39:04 +03:00
rvcQuality: 0,
modelSamplingRate: 48000,
2023-04-07 21:11:37 +03:00
2023-04-16 15:34:00 +03:00
enableEnhancer: 0,
enhancerTune: 0,
2023-03-09 00:55:57 +03:00
inputSampleRate: 24000,
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
onnxExecutionProviders: []
}
export const DefaultServerSetting_MMVCv13: ServerInfo = {
srcId: 107,
dstId: 100,
gpu: 0,
crossFadeOffsetRate: 0.0,
crossFadeEndRate: 1.0,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
2023-04-14 03:18:34 +03:00
solaEnabled: 0,
2023-03-09 00:55:57 +03:00
framework: Framework.ONNX,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
f0Detector: F0Detector.dio,
recordIO: 0,
2023-03-11 02:21:16 +03:00
tran: 0,
noiceScale: 0,
predictF0: 0,
silentThreshold: 0,
extraConvertSize: 0,
clusterInferRatio: 0,
2023-03-11 02:21:16 +03:00
2023-04-07 21:11:37 +03:00
indexRatio: 0,
2023-04-07 22:39:04 +03:00
rvcQuality: 0,
modelSamplingRate: 48000,
2023-04-16 15:34:00 +03:00
enableEnhancer: 0,
enhancerTune: 0,
2023-04-07 21:11:37 +03:00
2023-03-09 00:55:57 +03:00
inputSampleRate: 24000,
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
onnxExecutionProviders: []
}
2023-03-18 19:43:36 +03:00
export const DefaultServerSetting_so_vits_svc_40: ServerInfo = {
srcId: 0,
dstId: 0,
gpu: 0,
crossFadeOffsetRate: 0.0,
crossFadeEndRate: 1.0,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
2023-04-14 03:18:34 +03:00
solaEnabled: 0,
2023-03-18 19:43:36 +03:00
framework: Framework.PyTorch,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
f0Detector: F0Detector.dio,
recordIO: 0,
// tran: 0,
// noiceScale: 0,
// predictF0: 0,
// silentThreshold: 0,
tran: 10,
noiceScale: 0.3,
predictF0: 0,
silentThreshold: 0.00001,
extraConvertSize: 1024 * 32,
clusterInferRatio: 0.1,
2023-04-07 21:11:37 +03:00
indexRatio: 0,
2023-04-07 22:39:04 +03:00
rvcQuality: 0,
modelSamplingRate: 48000,
2023-04-16 15:34:00 +03:00
enableEnhancer: 0,
enhancerTune: 0,
2023-04-07 21:11:37 +03:00
2023-03-18 19:43:36 +03:00
inputSampleRate: 24000,
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
onnxExecutionProviders: []
}
2023-04-05 12:08:06 +03:00
export const DefaultServerSetting_so_vits_svc_40_c: ServerInfo = {
srcId: 0,
dstId: 0,
gpu: 0,
crossFadeOffsetRate: 0.0,
crossFadeEndRate: 1.0,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
2023-04-14 03:18:34 +03:00
solaEnabled: 0,
2023-04-05 12:08:06 +03:00
framework: Framework.ONNX,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
f0Detector: F0Detector.dio,
recordIO: 0,
// tran: 0,
// noiceScale: 0,
// predictF0: 0,
// silentThreshold: 0,
tran: 10,
noiceScale: 0.3,
predictF0: 0,
silentThreshold: 0.00001,
extraConvertSize: 1024 * 32,
clusterInferRatio: 0.1,
2023-04-07 21:11:37 +03:00
indexRatio: 0,
2023-04-07 22:39:04 +03:00
rvcQuality: 0,
modelSamplingRate: 48000,
2023-04-16 15:34:00 +03:00
enableEnhancer: 0,
enhancerTune: 0,
2023-04-07 21:11:37 +03:00
2023-04-05 12:08:06 +03:00
inputSampleRate: 24000,
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
onnxExecutionProviders: []
}
2023-03-11 02:37:41 +03:00
export const DefaultServerSetting_so_vits_svc_40v2: ServerInfo = {
2023-03-09 00:55:57 +03:00
srcId: 0,
dstId: 0,
gpu: 0,
crossFadeOffsetRate: 0.0,
crossFadeEndRate: 1.0,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
2023-04-14 03:18:34 +03:00
solaEnabled: 0,
2023-03-09 00:55:57 +03:00
framework: Framework.PyTorch,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
f0Detector: F0Detector.dio,
recordIO: 0,
// tran: 0,
// noiceScale: 0,
2023-03-11 03:26:02 +03:00
// predictF0: 0,
// silentThreshold: 0,
tran: 10,
noiceScale: 0.3,
predictF0: 0,
silentThreshold: 0.00001,
extraConvertSize: 1024 * 32,
clusterInferRatio: 0.1,
2023-03-11 02:21:16 +03:00
2023-04-07 21:11:37 +03:00
indexRatio: 0,
2023-04-07 22:39:04 +03:00
rvcQuality: 0,
modelSamplingRate: 48000,
2023-04-16 15:34:00 +03:00
enableEnhancer: 0,
enhancerTune: 0,
inputSampleRate: 24000,
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
onnxExecutionProviders: []
}
export const DefaultServerSetting_DDSP_SVC: ServerInfo = {
srcId: 0,
2023-04-18 03:49:47 +03:00
dstId: 1,
2023-04-16 15:34:00 +03:00
gpu: 0,
crossFadeOffsetRate: 0.0,
crossFadeEndRate: 1.0,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
solaEnabled: 0,
framework: Framework.PyTorch,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
f0Detector: F0Detector.dio,
recordIO: 0,
// tran: 0,
// noiceScale: 0,
// predictF0: 0,
// silentThreshold: 0,
tran: 10,
noiceScale: 0.3,
predictF0: 0,
silentThreshold: 0.00001,
extraConvertSize: 1024 * 32,
clusterInferRatio: 0.1,
indexRatio: 0,
rvcQuality: 0,
modelSamplingRate: 48000,
enableEnhancer: 0,
enhancerTune: 0,
2023-04-07 21:11:37 +03:00
2023-02-20 22:07:43 +03:00
inputSampleRate: 24000,
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
2023-02-19 13:22:00 +03:00
onnxExecutionProviders: []
}
2023-04-05 22:03:09 +03:00
export const DefaultServerSetting_RVC: ServerInfo = {
srcId: 0,
dstId: 0,
gpu: 0,
crossFadeOffsetRate: 0.1,
crossFadeEndRate: 0.8,
crossFadeOverlapSize: CrossFadeOverlapSize[1024],
2023-04-14 03:18:34 +03:00
solaEnabled: 1,
2023-04-05 22:03:09 +03:00
framework: Framework.PyTorch,
f0Factor: 1.0,
onnxExecutionProvider: OnnxExecutionProvider.CPUExecutionProvider,
f0Detector: F0Detector.harvest,
recordIO: 0,
// tran: 0,
// noiceScale: 0,
// predictF0: 0,
// silentThreshold: 0,
tran: 10,
noiceScale: 0.3,
predictF0: 0,
silentThreshold: 0.00001,
extraConvertSize: 1024 * 32,
clusterInferRatio: 0.1,
2023-04-07 21:11:37 +03:00
indexRatio: 0,
2023-04-07 22:39:04 +03:00
rvcQuality: 0,
modelSamplingRate: 48000,
2023-04-07 21:11:37 +03:00
2023-04-16 15:34:00 +03:00
enableEnhancer: 0,
enhancerTune: 0,
inputSampleRate: 48000,
2023-04-05 22:03:09 +03:00
//
status: "ok",
configFile: "",
pyTorchModelFile: "",
onnxModelFile: "",
onnxExecutionProviders: []
}
///////////////////////
// Workletセッティング
///////////////////////
2023-01-11 22:52:01 +03:00
export type WorkletSetting = {
numTrancateTreshold: number,
volTrancateThreshold: number,
volTrancateLength: number
}
2023-02-19 08:20:37 +03:00
export const DefaultWorkletSetting: WorkletSetting = {
2023-02-19 22:49:34 +03:00
numTrancateTreshold: 100,
2023-02-19 08:20:37 +03:00
volTrancateThreshold: 0.0005,
volTrancateLength: 32
2023-02-17 22:15:34 +03:00
}
2023-02-19 08:20:37 +03:00
///////////////////////
2023-02-19 20:21:51 +03:00
// Worklet Nodeセッティング
2023-02-19 08:20:37 +03:00
///////////////////////
2023-01-05 05:45:42 +03:00
export const Protocol = {
2023-01-04 20:28:36 +03:00
"sio": "sio",
"rest": "rest",
} as const
2023-01-05 05:45:42 +03:00
export type Protocol = typeof Protocol[keyof typeof Protocol]
2023-01-04 20:28:36 +03:00
2023-02-19 08:20:37 +03:00
export const SendingSampleRate = {
"48000": 48000,
2023-03-14 20:39:34 +03:00
"44100": 44100,
2023-02-19 08:20:37 +03:00
"24000": 24000
2023-01-04 20:28:36 +03:00
} as const
2023-02-19 08:20:37 +03:00
export type SendingSampleRate = typeof SendingSampleRate[keyof typeof SendingSampleRate]
2023-01-04 20:28:36 +03:00
2023-02-14 16:32:25 +03:00
export const DownSamplingMode = {
"decimate": "decimate",
"average": "average"
} as const
export type DownSamplingMode = typeof DownSamplingMode[keyof typeof DownSamplingMode]
2023-02-19 08:20:37 +03:00
2023-02-19 20:21:51 +03:00
export type WorkletNodeSetting = {
2023-02-19 08:20:37 +03:00
serverUrl: string,
protocol: Protocol,
sendingSampleRate: SendingSampleRate,
inputChunkNum: number,
downSamplingMode: DownSamplingMode,
}
2023-02-19 20:21:51 +03:00
export const DefaultWorkletNodeSetting: WorkletNodeSetting = {
2023-02-19 08:20:37 +03:00
serverUrl: "",
protocol: "sio",
2023-02-20 22:07:43 +03:00
sendingSampleRate: 24000,
2023-02-19 08:20:37 +03:00
inputChunkNum: 48,
downSamplingMode: "average"
}
2023-03-18 19:43:36 +03:00
export const DefaultWorkletNodeSetting_so_vits_svc_40: WorkletNodeSetting = {
serverUrl: "",
protocol: "sio",
sendingSampleRate: 24000,
inputChunkNum: 128,
downSamplingMode: "average"
}
export const DefaultWorkletNodeSetting_so_vits_svc_40v2: WorkletNodeSetting = {
serverUrl: "",
protocol: "sio",
sendingSampleRate: 24000,
inputChunkNum: 128,
downSamplingMode: "average"
}
2023-04-16 15:34:00 +03:00
export const DefaultWorkletNodeSetting_DDSP_SVC: WorkletNodeSetting = {
serverUrl: "",
protocol: "sio",
sendingSampleRate: 48000,
inputChunkNum: 256,
downSamplingMode: "average"
}
2023-04-05 22:03:09 +03:00
export const DefaultWorkletNodeSetting_RVC: WorkletNodeSetting = {
serverUrl: "",
protocol: "sio",
sendingSampleRate: 48000,
2023-04-05 22:03:09 +03:00
inputChunkNum: 256,
downSamplingMode: "average"
}
2023-02-19 08:20:37 +03:00
///////////////////////
// クライアントセッティング
///////////////////////
2023-01-04 20:28:36 +03:00
export const SampleRate = {
"48000": 48000,
} as const
export type SampleRate = typeof SampleRate[keyof typeof SampleRate]
2023-02-19 13:22:00 +03:00
export type Speaker = {
"id": number,
"name": string,
}
export type Correspondence = {
"sid": number,
"correspondence": number,
"dirname": string
}
2023-02-19 08:20:37 +03:00
export type VoiceChangerClientSetting = {
audioInput: string | MediaStream | null,
sampleRate: SampleRate, // 48000Hz
echoCancel: boolean,
noiseSuppression: boolean,
noiseSuppression2: boolean
2023-02-19 13:22:00 +03:00
speakers: Speaker[],
correspondences: Correspondence[],
2023-02-19 08:20:37 +03:00
inputGain: number
outputGain: number
}
2023-01-05 05:45:42 +03:00
2023-01-12 10:38:45 +03:00
export const DefaultVoiceChangerClientSetting: VoiceChangerClientSetting = {
2023-01-05 12:35:56 +03:00
audioInput: null,
2023-01-05 05:45:42 +03:00
sampleRate: 48000,
2023-02-19 13:22:00 +03:00
speakers: [
{
"id": 0,
"name": "user"
},
{
"id": 101,
"name": "ずんだもん"
},
{
"id": 102,
"name": "そら"
},
{
"id": 103,
"name": "めたん"
},
{
"id": 104,
"name": "つむぎ"
}
],
correspondences: [],
echoCancel: false,
noiseSuppression: false,
2023-02-14 23:02:51 +03:00
noiseSuppression2: false,
2023-02-12 12:19:22 +03:00
inputGain: 1.0,
outputGain: 1.0
2023-01-04 20:28:36 +03:00
}
2023-01-07 14:07:39 +03:00
2023-02-19 08:20:37 +03:00
////////////////////////////////////
// Exceptions
////////////////////////////////////
2023-01-05 05:45:42 +03:00
export const VOICE_CHANGER_CLIENT_EXCEPTION = {
ERR_SIO_CONNECT_FAILED: "ERR_SIO_CONNECT_FAILED",
ERR_SIO_INVALID_RESPONSE: "ERR_SIO_INVALID_RESPONSE",
2023-01-07 14:07:39 +03:00
ERR_REST_INVALID_RESPONSE: "ERR_REST_INVALID_RESPONSE",
ERR_MIC_STREAM_NOT_INITIALIZED: "ERR_MIC_STREAM_NOT_INITIALIZED"
2023-01-05 05:45:42 +03:00
} as const
export type VOICE_CHANGER_CLIENT_EXCEPTION = typeof VOICE_CHANGER_CLIENT_EXCEPTION[keyof typeof VOICE_CHANGER_CLIENT_EXCEPTION]
2023-01-04 20:28:36 +03:00
2023-01-29 03:42:45 +03:00
////////////////////////////////////
// indexedDB
////////////////////////////////////
2023-03-02 03:56:42 +03:00
export const INDEXEDDB_DB_APP_NAME = "INDEXEDDB_KEY_VOICE_CHANGER"
export const INDEXEDDB_DB_NAME = "INDEXEDDB_KEY_VOICE_CHANGER_DB"
2023-01-29 03:42:45 +03:00
export const INDEXEDDB_KEY_CLIENT = "INDEXEDDB_KEY_VOICE_CHANGER_LIB_CLIENT"
export const INDEXEDDB_KEY_SERVER = "INDEXEDDB_KEY_VOICE_CHANGER_LIB_SERVER"
2023-02-19 20:21:51 +03:00
export const INDEXEDDB_KEY_WORKLETNODE = "INDEXEDDB_KEY_VOICE_CHANGER_LIB_WORKLETNODE"
2023-01-29 09:25:44 +03:00
export const INDEXEDDB_KEY_MODEL_DATA = "INDEXEDDB_KEY_VOICE_CHANGER_LIB_MODEL_DATA"
export const INDEXEDDB_KEY_WORKLET = "INDEXEDDB_KEY_VOICE_CHANGER_LIB_WORKLET"
2023-04-13 02:00:28 +03:00
// ONNX
export type OnnxExporterInfo = {
"status": string
"path": string
"filename": string
}