release/1.0.5

分支 (6)

管理

管理

release/1.0.5

develop

release/0.3.9

release/0.x

legacy2

legacy

VoiceprintRecognition-Pytorch
/
infer_recognition.py

import argparse
import functools

from mvector.predict import MVectorPredictor
from mvector.utils.record import RecordAudio
from mvector.utils.utils import add_arguments, print_arguments

parser = argparse.ArgumentParser(description=__doc__)
add_arg = functools.partial(add_arguments, argparser=parser)
add_arg('configs',          str,    'configs/cam++.yml',        '配置文件')
add_arg('use_gpu',          bool,   True,                       '是否使用GPU预测')
add_arg('audio_db_path',    str,    'audio_db/',                '音频库的路径')
add_arg('record_seconds',   int,    3,                          '录音长度')
add_arg('threshold',        float,  0.6,                        '判断是否为同一个人的阈值')
add_arg('model_path',       str,    'models/CAMPPlus_Fbank/best_model/', '导出的预测模型文件路径')
args = parser.parse_args()
print_arguments(args=args)

# 获取识别器
predictor = MVectorPredictor(configs=args.configs,
                             threshold=args.threshold,
                             audio_db_path=args.audio_db_path,
                             model_path=args.model_path,
                             use_gpu=args.use_gpu)

record_audio = RecordAudio()

while True:
    select_fun = int(input("请选择功能，0为注册音频到声纹库，1为执行声纹识别，2为删除用户："))
    if select_fun == 0:
        input(f"按下回车键开机录音，录音{args.record_seconds}秒中：")
        audio_data = record_audio.record(record_seconds=args.record_seconds)
        name = input("请输入该音频用户的名称：")
        if name == '': continue
        predictor.register(user_name=name, audio_data=audio_data, sample_rate=record_audio.sample_rate)
    elif select_fun == 1:
        input(f"按下回车键开机录音，录音{args.record_seconds}秒中：")
        audio_data = record_audio.record(record_seconds=args.record_seconds)
        name, score = predictor.recognition(audio_data, sample_rate=record_audio.sample_rate)
        if name:
            print(f"识别说话的为：{name}，得分：{score}")
        else:
            print(f"没有识别到说话人，可能是没注册。")
    elif select_fun == 2:
        name = input("请输入该音频用户的名称：")
        if name == '': continue
        predictor.remove_user(user_name=name)
    else:
        print('请正确选择功能')