MCplayer
/

voxblink2_samresnet100_ft

Model card Files Files and versions

voxblink2_samresnet100_ft / download_mms_model.py

MCplayer's picture

speech similarity model

29c0409 3 months ago

1.14 kB

	import torchaudio
	import os
	from pathlib import Path

	def download_mms_model(download_dir="/inspire/hdd/project/embodied-multimodality/public/yqzhang/auto_evaluation/models/mms_fa"):
	    """Download the torchaudio MMS-FA model checkpoint into a directory.

	    Args:
	        download_dir: Directory that should receive the checkpoint. It is
	            created, including missing parents, if it does not exist yet.

	    Returns:
	        The directory path as a string when the model was fetched, or
	        ``None`` when fetching raised an exception. The error is printed
	        rather than re-raised so the caller can branch on the result.
	    """
	    # Create the target directory up front so the downloader can write to it.
	    download_path = Path(download_dir)
	    download_path.mkdir(parents=True, exist_ok=True)

	    print(f"开始下载MMS-FA模型到: {download_path}")

	    try:
	        # Instantiating the model is what triggers the checkpoint download.
	        # Per the torchaudio docs, dl_kwargs is handed to
	        # torch.hub.load_state_dict_from_url, so model_dir selects where the
	        # file is stored. The model object itself is not needed here.
	        torchaudio.pipelines.MMS_FA.get_model(
	            with_star=False,
	            dl_kwargs={"model_dir": str(download_path)},
	        )
	    except Exception as e:
	        # Best-effort helper: report the failure and signal it with None.
	        print(f"❌ 下载失败: {e}")
	        return None

	    # Only reached when the download call completed without raising.
	    print(f"✅ 模型下载成功！保存在: {download_path}")
	    print(f"模型文件: {list(download_path.glob('*'))}")
	    return str(download_path)

	if __name__ == "__main__":
	    # Fetch the model into the default directory.
	    model_path = download_mms_model()
	    if not model_path:
	        # The helper has already printed the error. Exit non-zero so shell
	        # pipelines and job schedulers can tell that the download failed.
	        raise SystemExit(1)

	    # Show how to point the evaluator at the downloaded model directory.
	    print("\n使用方法:")
	    print(f"evaluator = SpeakerSimilarityEvaluator(alignment_model_dir='{model_path}')")