1 Star 1 Fork 2

AI Large Model/Step Audio

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
文件
克隆/下载
tts_inference.py 1.81 KB
一键复制 编辑 原始数据 按行查看 历史
yanc 提交于 2025-02-18 15:18 +08:00 . update tts speakers
import torchaudio
import argparse
from tts import StepAudioTTS
from tokenizer import StepAudioTokenizer
from utils import load_audio
import os
def main():
parser = argparse.ArgumentParser(description="StepAudio Offline Inference")
parser.add_argument(
"--model-path", type=str, required=True, help="Base path for model files"
)
parser.add_argument(
"--synthesis-type", type=str, default="tts", help="Use tts or Clone for Synthesis"
)
parser.add_argument(
"--output-path", type=str, required=True, help="Output path for synthesis audios"
)
args = parser.parse_args()
os.makedirs(f"{args.output_path}", exist_ok=True)
encoder = StepAudioTokenizer(f"{args.model_path}/Step-Audio-Tokenizer")
tts_engine = StepAudioTTS(f"{args.model_path}/Step-Audio-TTS-3B", encoder)
if args.synthesis_type == "tts":
text = "(RAP)我踏上自由的征途,追逐那遥远的梦想,挣脱束缚的枷锁,让心灵随风飘荡,每一步都充满力量,每一刻都无比闪亮,自由的信念在燃烧,照亮我前进的方向!"
output_audio, sr = tts_engine(text, "Tingting")
torchaudio.save(f"{args.output_path}/output_tts.wav", output_audio, sr)
else:
clone_speaker = {"speaker":"test","prompt_text":"叫做秋风起蟹脚痒,啊,什么意思呢?就是说这秋风一起啊,螃蟹就该上市了。", "wav_path":"examples/prompt_wav_yuqian.wav"}
text_clone = "人活一辈子,生老病死,总得是有高峰,有低谷,有顺境,有逆境,每个人都差不多。要不老话怎么讲,三十年河东,三十年河西呢。"
output_audio, sr = tts_engine(text_clone, "",clone_speaker)
torchaudio.save(f"{args.output_path}/output_clone.wav", output_audio, sr)
if __name__ == "__main__":
main()
Loading...
马建仓 AI 助手
尝试更多
代码解读
代码找茬
代码优化
1
https://gitee.com/AI-LargeModel/Step-Audio.git
git@gitee.com:AI-LargeModel/Step-Audio.git
AI-LargeModel
Step-Audio
Step Audio
main

搜索帮助