# voice-changer/client/python/vc_client.py
# 2023-02-24 02:51:52 +09:00
#
# 156 lines
# 4.3 KiB
# Python

import argparse
import pyaudio
import wave
import struct
import socketio
import ssl
from datetime import datetime
import time
import urllib3
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
import signal
import sys
import numpy as np
# Number of frames requested per audio read in the main loop; the same value
# is passed to PyAudio as frames_per_buffer when the streams are opened.
BUFFER_SIZE = 2048 * 2
def setupArgParser():
    """Build the command-line parser for the voice-changer client.

    Options:
        --url     Server URL to connect to (default "http://localhost:18888").
        --input   Index of the audio input device (required).
        --output  Index of the audio output device (default -1). The script's
                  entry point only opens an output stream when this is >= 0.
        --to      Session id string (default ""); parsed but not used by the
                  code in this file.

    Returns:
        argparse.ArgumentParser: the configured, not-yet-parsed parser.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("--url", type=str, default="http://localhost:18888", help="url")
    parser.add_argument("--input", type=int, required=True, help="input device index")
    # The help text previously read "input device index" (copy-paste error).
    parser.add_argument("--output", type=int, default=-1, help="output device index")
    parser.add_argument("--to", type=str, default="", help="sid")
    return parser
class MockStream:
    """File-backed stand-in for an audio stream.

    Exposes the subset of the stream interface used in this file (``read``,
    ``write``, ``stop_stream``, ``close``), but reads from / writes to WAV
    files through the ``wave`` module instead of an audio device.

    Attributes:
        sampling_rate: Frame rate written into the output WAV header.
        start_count: Remaining number of leading silent chunks ``read``
            returns before touching the input file (starts at 2).
        end_count: Remaining number of trailing silent chunks tolerated after
            the input file is exhausted (starts at 2).
        vc_end_flag: Becomes True once the input file is exhausted and the
            trailing-silence budget has been used up.
        fr: Open ``wave`` reader, or None.
        fw: Open ``wave`` writer, or None.
    """

    def __init__(self, sampling_rate):
        self.sampling_rate = sampling_rate
        self.start_count = 2
        self.end_count = 2
        # The original code set ``Hyperparameters.VC_END_FLAG`` here, but no
        # ``Hyperparameters`` name exists in this file, so reaching the end of
        # the input raised NameError. The flag now lives on the instance.
        self.vc_end_flag = False
        self.fr = None
        self.fw = None

    def open_inputfile(self, input_filename):
        """Open ``input_filename`` as the WAV source for ``read``."""
        self.fr = wave.open(input_filename, 'rb')

    def open_outputfile(self, output_filename):
        """Open ``output_filename`` as a mono, 16-bit WAV sink for ``write``."""
        self.fw = wave.open(output_filename, 'wb')
        self.fw.setnchannels(1)
        self.fw.setsampwidth(2)
        self.fw.setframerate(self.sampling_rate)

    def read(self, length, exception_on_overflow=False):
        """Return the next chunk of audio as bytes.

        The first two calls return ``length * 2`` zero bytes (silence, at two
        bytes per frame). Later calls return up to ``length`` frames from the
        input file. Once the file yields no data, silence is returned instead;
        from the third such empty read onward ``vc_end_flag`` is True.

        Args:
            length: Number of frames to read.
            exception_on_overflow: Accepted so the call signature matches the
                one used for the device stream in this file; ignored here.

        Returns:
            bytes: Raw frame data, or zero-filled bytes of size ``length * 2``.
        """
        if self.start_count > 0:
            wav = bytes(length * 2)
            self.start_count -= 1
        else:
            wav = self.fr.readframes(length)
        if len(wav) <= 0:
            # Input exhausted: keep feeding silence and count down to the end.
            wav = bytes(length * 2)
            self.end_count -= 1
            if self.end_count < 0:
                self.vc_end_flag = True
        return wav

    def write(self, wav):
        """Append raw frame bytes ``wav`` to the output WAV file."""
        self.fw.writeframes(wav)

    def stop_stream(self):
        """No-op; present so this class can be used where a device stream is."""
        pass

    def close(self):
        """Close whichever of the input/output files are open."""
        if self.fr is not None:
            self.fr.close()
            self.fr = None
        if self.fw is not None:
            self.fw.close()
            self.fw = None
class MyCustomNamespace(socketio.ClientNamespace):
    """Socket.IO client namespace that forwards received audio to output sinks.

    Each ``response`` event carries a message whose first three items are read
    as: the timestamp that was sent with the request (milliseconds), the audio
    payload, and a performance value that is printed as-is.
    """

    def __init__(self, namespace: str, audio_output_stream, file_output_stream):
        """Remember the two optional sinks; either may be None."""
        super().__init__(namespace)
        self.file_output_stream = file_output_stream
        self.audio_output_stream = audio_output_stream

    def on_connect(self):
        """Report that the connection was established."""
        print('connected')

    def on_disconnect(self):
        """Report that the connection was closed."""
        print('disconnected')

    def on_response(self, msg):
        """Print the round-trip time and write the payload to every sink set."""
        sent_at = msg[0]
        elapsed_ms = time.time() * 1000 - sent_at
        payload, perf = msg[1], msg[2]
        print(f"RT:{elapsed_ms}msec", perf)
        # File sink first, then the audio device, skipping any that are unset.
        for sink in (self.file_output_stream, self.audio_output_stream):
            if sink is not None:
                sink.write(payload)
if __name__ == '__main__':
    # Script entry point: capture audio from the input device, send each chunk
    # to the server over Socket.IO, and let MyCustomNamespace play/write the
    # responses until the user interrupts with Ctrl-C.
    parser = setupArgParser()
    args, unknown = parser.parse_known_args()
    url = args.url
    inputDevice = args.input
    outputDevice = args.output
    to = args.to  # parsed but not used below

    audio = pyaudio.PyAudio()
    # Pre-declare every resource so the cleanup in ``finally`` can tell what
    # was actually opened, whichever step fails or is interrupted.
    audio_input_stream = None
    audio_output_stream = None
    mock_stream_out = None
    sio = None
    try:
        audio_input_stream = audio.open(
            format=pyaudio.paInt16,
            channels=1,
            rate=24000,
            frames_per_buffer=BUFFER_SIZE,
            input_device_index=inputDevice,
            input=True)

        print("output device", outputDevice)
        # A negative output index means "no playback": no stream is opened.
        if outputDevice >= 0:
            audio_output_stream = audio.open(
                format=pyaudio.paInt16,
                channels=1,
                rate=24000,
                frames_per_buffer=BUFFER_SIZE,
                output_device_index=outputDevice,
                output=True)

        # Debug hooks: uncomment to also dump the received audio to a file.
        # mock_stream_out = MockStream(24000)
        # mock_stream_out.open_outputfile("test.wav")
        # mock_stream_in = MockStream(24000)
        # mock_stream_in.open_outputfile("test_in.wav")

        my_namespace = MyCustomNamespace("/test", audio_output_stream, mock_stream_out)
        sio = socketio.Client(ssl_verify=False)
        sio.register_namespace(my_namespace)
        sio.connect(url)

        while True:
            in_wav = audio_input_stream.read(BUFFER_SIZE, exception_on_overflow=False)
            sio.emit('request_message', [time.time() * 1000, in_wav], namespace="/test")
    except KeyboardInterrupt:
        # Ctrl-C is the normal way to stop the client; fall through to cleanup.
        pass
    finally:
        # Previously cleanup ran only on KeyboardInterrupt and dereferenced
        # audio_output_stream / mock_stream_out even when they were None,
        # raising AttributeError. Release only what was really opened.
        if sio is not None:
            sio.disconnect()
        for stream in (audio_input_stream, audio_output_stream):
            if stream is not None:
                stream.stop_stream()
                stream.close()
        audio.terminate()
        if mock_stream_out is not None:
            mock_stream_out.close()