voxblink2_samresnet100_ft / download_mms_model.py
MCplayer's picture
speech similarity model
29c0409
raw
history blame
1.14 kB
import torchaudio
import os
from pathlib import Path
def download_mms_model(download_dir="/inspire/hdd/project/embodied-multimodality/public/yqzhang/auto_evaluation/models/mms_fa"):
    """Download the torchaudio MMS-FA model into ``download_dir``.

    The target directory (and any missing parents) is created, then the
    ``torchaudio.pipelines.MMS_FA`` bundle is asked to build its model with
    ``model_dir`` pointing at that directory.

    Args:
        download_dir: Directory the model files should be stored in. The
            default is an absolute path specific to the original author's
            machine; pass an explicit path when running elsewhere.

    Returns:
        ``download_dir`` as a string on success, or ``None`` if any step
        failed. Failures are printed rather than raised.
    """
    download_path = Path(download_dir)

    try:
        # Directory creation lives inside the ``try`` so that an unusable
        # path (permission denied, a regular file in the way, ...) is
        # reported through the same "print and return None" channel as a
        # failed download instead of escaping as an uncaught exception.
        download_path.mkdir(parents=True, exist_ok=True)
        print(f"开始下载MMS-FA模型到: {download_path}")

        # Look up the MMS-FA pipeline bundle.
        bundle = torchaudio.pipelines.MMS_FA

        # The returned model object is not needed here; the call is made
        # only so the weights end up under ``download_path``.
        bundle.get_model(with_star=False, dl_kwargs={'model_dir': str(download_path)})

        print(f"✅ 模型下载成功!保存在: {download_path}")
        print(f"模型文件: {list(download_path.glob('*'))}")
        return str(download_path)
    except Exception as e:
        # Script-level boundary: report whatever went wrong and signal
        # failure to the caller with ``None``.
        print(f"❌ 下载失败: {e}")
        return None
if __name__ == "__main__":
    # Fetch the model into the default directory; a falsy result means the
    # download failed and the error has already been printed.
    saved_dir = download_mms_model()
    if saved_dir:
        # Print a usage hint showing how to pass the directory on.
        usage_lines = (
            "\n使用方法:",
            f"evaluator = SpeakerSimilarityEvaluator(alignment_model_dir='{saved_dir}')",
        )
        print(*usage_lines, sep="\n")