From 70ee188d28864578fd0bf8439e28fbb5a2614ab8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E8=B5=B5=E6=B1=9F=E6=B1=9F?= Date: Tue, 27 May 2025 20:16:35 +0800 Subject: [PATCH] =?UTF-8?q?fix:=20cosyvoice=20readme=E4=BF=AE=E6=94=B9?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../built-in/audio/CosyVoice/README.md | 29 +++++++++++++++++-- 1 file changed, 26 insertions(+), 3 deletions(-) diff --git a/ACL_PyTorch/built-in/audio/CosyVoice/README.md b/ACL_PyTorch/built-in/audio/CosyVoice/README.md index b33213321d..1265ca94a6 100755 --- a/ACL_PyTorch/built-in/audio/CosyVoice/README.md +++ b/ACL_PyTorch/built-in/audio/CosyVoice/README.md @@ -61,13 +61,21 @@ wget https://www.openfst.org/twiki/pub/FST/FstDownload/openfst-1.8.3.tar.gz # 进入目录后编译安装 ./configure --enable-far --enable-mpdt --enable-pdt + make -j$(nproc) make install + # 确认动态库文件存在: + ls /usr/local/lib/libfstmpdtscript.so.26 + # 配置动态库路径 + export LD_LIBRARY_PATH=/usr/local/lib:$LD_LIBRARY_PATH + sudo ldconfig + # 安装WeTextProcessing pip3 install WeTextProcessing==1.0.4.1 ``` + 3. 安装msit工具 - 参考[msit](https://gitee.com/ascend/msit)安装工具中的benchmark和surgen组件。 + 参考[msit](https://gitee.com/ascend/msit)安装工具中的benchmark和surgeon组件。(未安装会提示 ais_bench 导入失败报错) 4. 获取权重数据 @@ -82,6 +90,19 @@ git clone https://www.modelscope.cn/iic/CosyVoice-300M.git CosyVoice/CosyVoice-300M ``` +5. 文件结构如下: + ```text + 📁 CosyVoice/ + ├── 📁 CosyVoice/ + │ ├── 📁 CosyVoice的源码文件 # CosyVoice其他的源码文件,此处不一一列举 + │ ├── 📁 CosyVoice-300M/ # 权重文件 + │ ├── 📄 infer.py # 推理脚本 + │ └── 📄 modify_onnx.py # 模型转换脚本 + ├── 📄 diff_300I.patch + └── 📄 diff_800I.patch + ``` + + ## 模型推理 ### 1 模型转换 @@ -116,15 +137,17 @@ ### 2 开始推理验证 - 1. 首先移动infer.py文件到CosyVoice目录下 + 1. **首先移动infer.py文件到CosyVoice目录下** 2. 设置环境变量,执行推理命令 ``` - # 指定使用NPU ID,默认为0 + # 1. 指定使用NPU ID,默认为0 export ASCEND_RT_VISIBLE_DEVICES=0 + # 2. 设置环境变量 export PYTHONPATH=third_party/Matcha-TTS:$PYTHONPATH + # 3. 
执行推理脚本 python3 infer.py --model_path=${CosyVoice-300M} ``` - --model_path: 权重路径 -- Gitee