# File viewer metadata: 8 lines, 614 B, Python
from cosyvoice.cli.cosyvoice import CosyVoice
from cosyvoice.utils.file_utils import load_wav
import torchaudio

# Zero-shot synthesis demo script.
#
# Steps, in order:
#   1. Construct a CosyVoice model from a local directory.
#   2. Print the result of ``list_avaliable_spks()``.
#   3. Load a reference recording with ``load_wav``.
#   4. Call ``inference_zero_shot`` and save the ``'tts_speech'`` entry of
#      every item it yields to ``zero_shot_<index>.wav``.

# Local model directory. Raw string so the Windows backslashes stay literal.
MODEL_DIR = r'D:\AI\download\CosyVoice-300M'

# Reference recording handed to inference_zero_shot as the speech prompt.
PROMPT_WAV = 'example_audio.wav'

# Second argument of load_wav. The `_16k` suffix on the variable below
# suggests this is a 16 kHz target sample rate -- TODO confirm against load_wav.
PROMPT_SAMPLE_RATE = 16000

# Sample rate written into the output WAV header by torchaudio.save.
# NOTE(review): assumes the model emits 22.05 kHz audio -- confirm for the
# model in MODEL_DIR, otherwise playback speed/pitch will be wrong.
OUTPUT_SAMPLE_RATE = 22050

# First positional argument of inference_zero_shot (the text to synthesize).
TTS_TEXT = '你好,我是通义生成式语音大模型,请问有什么可以帮您的吗?'

# Second positional argument of inference_zero_shot; presumably the transcript
# of PROMPT_WAV -- verify against the library documentation.
PROMPT_TEXT = '对,这就是我,万人敬仰的太乙真人'

cosyvoice = CosyVoice(MODEL_DIR, load_jit=True, load_onnx=False, fp16=True)

# NOTE: "avaliable" is the spelling used by the call in the original script;
# it is presumably the library's actual method name, so do not "correct" it
# without checking the installed CosyVoice version.
print(cosyvoice.list_avaliable_spks())

prompt_speech_16k = load_wav(PROMPT_WAV, PROMPT_SAMPLE_RATE)

# inference_zero_shot is iterated, so it may yield more than one item; each
# item is indexed with 'tts_speech' and written to its own numbered file.
zero_shot_outputs = cosyvoice.inference_zero_shot(
    TTS_TEXT,
    PROMPT_TEXT,
    prompt_speech_16k,
    stream=False,
)
for idx, output in enumerate(zero_shot_outputs):
    torchaudio.save(f'zero_shot_{idx}.wav', output['tts_speech'], OUTPUT_SAMPLE_RATE)