From 86cdb40906994db9d7072f6e73ca6de7f1ff4ce9 Mon Sep 17 00:00:00 2001 From: "yanyuxiyangzk@126.com" Date: Mon, 8 Apr 2024 14:52:10 +0800 Subject: [PATCH] tts --- llm/README.md | 8 ++++++++ tts/README.md | 12 ++++++++++++ tts/tts_test.py | 28 ++++++++++++++++++++++++++++ 3 files changed, 48 insertions(+) create mode 100644 tts/README.md create mode 100644 tts/tts_test.py diff --git a/llm/README.md b/llm/README.md index 6e92bbf..5f06829 100644 --- a/llm/README.md +++ b/llm/README.md @@ -10,6 +10,14 @@ python -m vllm.entrypoints.openai.api_server --tensor-parallel-size=1 --trust-r python -m vllm.entrypoints.openai.api_server --port 8101 --tensor-parallel-size=1 --trust-remote-code --max-model-len 1024 --model THUDM/chatglm3-6b +CUDA_VISIBLE_DEVICES=6,7 python -m vllm.entrypoints.openai.api_server \ +--model="/data/mnt/ShareFolder/common_models/Ziya-Reader-13B-v1.0" \ +--max-model-len=8192 \ +--tensor-parallel-size=2 \ +--trust-remote-code \ +--port=8101 + + 3、测试 curl http://127.0.0.1:8101/v1/completions \ -H "Content-Type: application/json" \ diff --git a/tts/README.md b/tts/README.md new file mode 100644 index 0000000..e25b513 --- /dev/null +++ b/tts/README.md @@ -0,0 +1,12 @@ +一、采用gpt-sovits方案,bert-sovits适合长音频训练,gpt-sovits运行短音频快速推理 + + + + + + + + +http://127.0.0.1:9880/tts?text=我是一个粉刷匠,粉刷本领强。我要把那新房子,刷得更漂亮。刷了房顶又刷墙,刷子像飞一样。哎呀我的小鼻子,变呀变了样。&text_lang=zh&ref_audio_path=mengpai.wav&prompt_lang=zh&prompt_text=呜哇好生气啊!不要把我跟一斗相提并论!&text_split_method=cut5&batch_size=1&media_type=wav&streaming_mode=true + + diff --git a/tts/tts_test.py b/tts/tts_test.py new file mode 100644 index 0000000..08437d5 --- /dev/null +++ b/tts/tts_test.py @@ -0,0 +1,28 @@ +import requests +import pyaudio + +# 流式传输音频的URL,你可以自由改成Post +stream_url = 'http://127.0.0.1:5000/tts?text=这是一段测试文本,旨在通过多种语言风格和复杂性的内容来全面检验文本到语音系统的性能。接下来,我们会探索各种主题和语言结构,包括文学引用、技术性描述、日常会话以及诗歌等。首先,让我们从一段简单的描述性文本开始:“在一个阳光明媚的下午,一位年轻的旅者站在山顶上,眺望着下方那宽广而繁忙的城市。他的心中充满了对未来的憧憬和对旅途的期待。”这段文本测试了系统对自然景观描写的处理能力和情感表达的细腻程度。&stream=true' + +# 初始化pyaudio +p = pyaudio.PyAudio() + +# 打开音频流 +stream = p.open(format=p.get_format_from_width(2), + channels=1, + rate=32000, + output=True) + +# 使用requests获取音频流,你可以自由改成Post +response = requests.get(stream_url, stream=True) + +# 读取数据块并播放 +for data in response.iter_content(chunk_size=1024): + stream.write(data) + +# 停止和关闭流 +stream.stop_stream() +stream.close() + +# 终止pyaudio +p.terminate()