批量语音转文字python

图 1:批量语音转文字(Python)

from pydub import AudioSegment
from aip import AipSpeech
#baidu-aip

# 百度AI库获取的参数

# 构造读取语音文件函数
def get_file_content(filePath):
    """Read the file at *filePath* in binary mode and return its bytes."""
    with open(filePath, mode='rb') as audio_file:
        payload = audio_file.read()
    return payload



def cut_wav(segment):
    """Export one 60-second slice of the module-level ``wav`` to disk.

    Relies on two module-level names that must be assigned before the call:
    ``wav`` (the loaded audio, sliced here by millisecond offsets) and
    ``filename`` (used as the prefix of the output file name).  The slice is
    written to ``record/<filename>cut<segment>.wav``.

    Args:
        segment: Zero-based index of the one-minute slice to export.
    """
    import os  # local import so the block does not depend on file-level imports

    # The export target lives in ./record; create it on first use so the
    # export does not fail when the directory is missing.
    os.makedirs('record', exist_ok=True)

    minute_ms = 60 * 1000
    start_ms = segment * minute_ms
    wav[start_ms:start_ms + minute_ms].export(
        'record' + '/' + filename + 'cut' + str(segment) + '.wav',
        format="wav",
    )



if __name__ == '__main__':
    import math
    import os

    # Step 1: split the recording into one-minute segments.
    filename = '04月05日_1'

    wav = AudioSegment.from_wav(filename + '.wav')

    # Number of complete minutes in the recording.
    cut_count = int(wav.duration_seconds / 60)
    print(cut_count)

    # cut_wav() writes into ./record, so make sure the directory exists.
    os.makedirs('record', exist_ok=True)

    # Segments are numbered from 0; a trailing partial minute adds one more.
    # Starting at 0 keeps the first minute, and rounding up (instead of always
    # exporting index cut_count) avoids an empty tail file when the duration
    # is an exact multiple of 60 seconds.
    segment_count = math.ceil(wav.duration_seconds / 60)
    for i in range(segment_count):
        cut_wav(i)

    # Step 2: batch speech-to-text over every exported segment.

    # NOTE(review): credentials should not live in source control.  The
    # BAIDU_* environment variables override the values below; the literals
    # are kept only as a backward-compatible fallback.
    APP_ID = os.environ.get('BAIDU_APP_ID', '26029972')
    API_KEY = os.environ.get('BAIDU_API_KEY', 'uDbACFSOmNVOkXyvydMSUuQR')
    SECRET_KEY = os.environ.get('BAIDU_SECRET_KEY',
                                'cuI1zBwGjgHtNFI3Mx15RXCQvrIrMYVN')

    client = AipSpeech(APP_ID, API_KEY, SECRET_KEY)

    for i in range(segment_count):
        # Build the path from the same pieces cut_wav() uses, so the file read
        # here is the file written in step 1 (no backslash escapes to get
        # wrong, hence no raw-string literal needed).
        segment_path = os.path.join('record', filename + 'cut' + str(i) + '.wav')
        # NOTE(review): 16000 is passed as the sample rate; presumably the
        # exported WAV must actually be 16 kHz -- confirm against the input.
        result = client.asr(get_file_content(segment_path), 'wav', 16000,
                            {'lan': 'zh', })
        print(result)












欢迎分享,转载请注明来源:内存溢出

原文地址: https://outofmemory.cn/langs/734649.html

(0)
打赏 微信扫一扫 支付宝扫一扫
上一篇 2022-04-27
下一篇 2022-04-27

发表评论

登录后才能评论

评论列表(0条)

保存