# 1. 下载代码
```bash
git clone --recursive https://github.com/FunAudioLLM/CosyVoice.git
cd CosyVoice
git submodule update --init --recursive
```
# 2. 修改 requirements.txt
```text
onnxruntime-gpu==1.18.0
onnxruntime==1.18.0
```
改为
# 3. 创建 Python 环境
执行 `00 conda 创建环境.bat`,创建 Python 3.10 环境。
# 4. 激活 Conda 环境
执行 `激活 conda 环境.bat`,激活 conda 环境。
# 5. 安装依赖
```bash
conda install -y -c conda-forge pynini==2.1.5
pip install -r requirements.txt -i https://mirrors.aliyun.com/pypi/simple/ --trusted-host=mirrors.aliyun.com
```
# 6. 下载模型
## 6.1 代码下载模型
创建一个 `download_models.py` 文件,内容如下:
```python
from modelscope import snapshot_download

snapshot_download('iic/CosyVoice2-0.5B', local_dir='pretrained_models/CosyVoice2-0.5B')
snapshot_download('iic/CosyVoice-300M', local_dir='pretrained_models/CosyVoice-300M')
snapshot_download('iic/CosyVoice-300M-25Hz', local_dir='pretrained_models/CosyVoice-300M-25Hz')
snapshot_download('iic/CosyVoice-300M-SFT', local_dir='pretrained_models/CosyVoice-300M-SFT')
snapshot_download('iic/CosyVoice-300M-Instruct', local_dir='pretrained_models/CosyVoice-300M-Instruct')
snapshot_download('iic/CosyVoice-ttsfrd', local_dir='pretrained_models/CosyVoice-ttsfrd')
```
运行脚本下载模型:
```bash
python download_models.py
```
如果模型下载失败,可尝试安装指定版本的 modelscope 后重新下载:
```bash
pip install modelscope==1.17.0 -i https://pypi.tuna.tsinghua.edu.cn/simple
```
## 6.2 git 下载模型
```bash
mkdir -p pretrained_models

git clone https://www.modelscope.cn/iic/CosyVoice2-0.5B.git pretrained_models/CosyVoice2-0.5B
git clone https://www.modelscope.cn/iic/CosyVoice-300M.git pretrained_models/CosyVoice-300M
git clone https://www.modelscope.cn/iic/CosyVoice-300M-25Hz.git pretrained_models/CosyVoice-300M-25Hz
git clone https://www.modelscope.cn/iic/CosyVoice-300M-SFT.git pretrained_models/CosyVoice-300M-SFT
git clone https://www.modelscope.cn/iic/CosyVoice-300M-Instruct.git pretrained_models/CosyVoice-300M-Instruct
git clone https://www.modelscope.cn/iic/CosyVoice-ttsfrd.git pretrained_models/CosyVoice-ttsfrd
```
# 7. 启动
## 7.1 内置音色模型启动
```bat
@echo off
set PYTHONPATH=third_party/Matcha-TTS
call activate .\env
python webui.py --port 50000 --model_dir pretrained_models/CosyVoice-300M-SFT
start http://127.0.0.1:50000
pause
```
## 7.2 克隆音色 + 跨语种克隆模型启动
```bat
@echo off
set PYTHONPATH=third_party/Matcha-TTS
call activate .\env
start http://127.0.0.1:50001
python webui.py --port 50001 --model_dir pretrained_models/CosyVoice-300M
pause
```
## 7.3 内置音色 + 语气微调模型启动
```bat
@echo off
set PYTHONPATH=third_party/Matcha-TTS
call activate .\env
start http://127.0.0.1:50002
python webui.py --port 50002 --model_dir pretrained_models/CosyVoice-300M-Instruct
pause
```