python录音

#!/usr/bin/env python

# -*- coding: utf-8 -*-

# Date : 2018-12-02 19:04:55

import base64
import os
import time
import wave
import webbrowser
from urllib.parse import quote

import requests
from pyaudio import PyAudio, paInt16

# Recording parameters used when capturing audio and writing the WAV file.
framerate = 16000  # sampling rate in Hz
num_samples = 2000  # frames read from the input stream per chunk
channels = 1  # number of audio channels (mono)
sampwidth = 2  # sample width in bytes

# Path the recording is written to and later read back from.
FILEPATH = 'speech.wav'

# Token endpoint template; the two %s slots take the API key and secret key.
base_url = "https://openapi.baidu.com/oauth/2.0/token?grant_type=client_credentials&client_id=%s&client_secret=%s"

# Credentials can be supplied through the environment so that real keys do
# not have to live in the source file. The original literals stay as the
# fallback, so behavior is unchanged when the variables are not set.
APIKey = os.environ.get("BAIDU_API_KEY", "A0YzbOlHhA7P3w8pKpeaPH3r")
SecretKey = os.environ.get("BAIDU_SECRET_KEY", "L8Y8c1MaQj0uNHMcjdrYKGLYyhQGZOpQ")

# Fully formatted token URL that is passed to getToken().
HOST = base_url % (APIKey, SecretKey)

def getToken(host):
    """Request an access token from the given token endpoint.

    Args:
        host: Full token URL, including the credential query parameters.

    Returns:
        The value of the ``access_token`` field of the JSON response.

    Raises:
        KeyError: If the JSON response contains no ``access_token`` field.
            The message includes the response body so the server-side
            error is visible.
    """
    # requests applies no timeout by default, so an unresponsive server
    # would block this call forever.
    res = requests.post(host, timeout=10)
    payload = res.json()
    try:
        return payload['access_token']
    except KeyError:
        raise KeyError(
            'access_token missing from token response: %r' % (payload,)
        ) from None

def save_wave_file(filepath, data, nchannels=None, width=None, rate=None):
    """Write raw PCM chunks to a WAV file.

    Args:
        filepath: Destination path of the WAV file.
        data: Iterable of ``bytes`` chunks; they are concatenated in order.
        nchannels: Number of channels. Defaults to the module-level
            ``channels``.
        width: Sample width in bytes. Defaults to the module-level
            ``sampwidth``.
        rate: Sampling rate in Hz. Defaults to the module-level
            ``framerate``.
    """
    # Fall back to the module-wide recording settings only when the caller
    # did not override them, so existing two-argument calls behave as before.
    nchannels = channels if nchannels is None else nchannels
    width = sampwidth if width is None else width
    rate = framerate if rate is None else rate

    # The context manager closes the writer even if a setter or the write
    # raises, so the file handle is never leaked.
    with wave.open(filepath, 'wb') as wf:
        wf.setnchannels(nchannels)
        wf.setsampwidth(width)
        wf.setframerate(rate)
        wf.writeframes(b''.join(data))

def my_record():
    """Record roughly four seconds of microphone input and save it as WAV.

    Audio is read in chunks of ``num_samples`` frames using the module-level
    ``channels`` and ``framerate`` settings, then written to ``FILEPATH``
    via ``save_wave_file``. The stream and the PyAudio instance are always
    released, including when opening or reading the stream fails.
    """
    pa = PyAudio()
    stream = None
    my_buf = []
    try:
        stream = pa.open(format=paInt16, channels=channels,
                         rate=framerate, input=True,
                         frames_per_buffer=num_samples)
        # A monotonic clock keeps the recording length independent of
        # wall-clock adjustments.
        deadline = time.monotonic() + 4  # seconds
        print('正在录音...')
        while time.monotonic() < deadline:
            my_buf.append(stream.read(num_samples))
        print('录音结束.')
    finally:
        # This function may be called repeatedly, so release the audio
        # device every time instead of leaking one instance per call.
        if stream is not None:
            stream.stop_stream()
            stream.close()
        pa.terminate()
    save_wave_file(FILEPATH, my_buf)

def get_audio(file):
    """Return the complete contents of ``file`` as bytes.

    Args:
        file: Path of the file to read; it is opened in binary mode.
    """
    with open(file, 'rb') as audio_file:
        return audio_file.read()

def speech2text(speech_data, token, dev_pid=1537):
    """Send recorded audio to the recognition endpoint and return the text.

    Args:
        speech_data: Raw bytes of the audio file; sent base64-encoded.
        token: Access token, as returned by ``getToken``.
        dev_pid: Language/model id forwarded to the service unchanged.

    Returns:
        The first entry of the response's ``result`` list when it is present
        and non-empty; otherwise the whole decoded JSON response, so the
        caller can inspect the error.
    """
    payload = {
        'format': 'wav',
        # NOTE(review): sent as a string, exactly as before; confirm
        # whether the service expects an integer here.
        'rate': '16000',
        'channel': 1,
        'cuid': '*******',
        # Length of the raw audio, not of the base64 text.
        'len': len(speech_data),
        'speech': base64.b64encode(speech_data).decode('utf-8'),
        'token': token,
        'dev_pid': dev_pid,
    }

    print('正在识别...')
    # json= serializes the payload and sets the JSON Content-Type header,
    # so no explicit header is needed. requests has no default timeout;
    # bound the wait so a stalled upload cannot hang the program.
    r = requests.post('https://vop.baidu.com/server_api', json=payload,
                      timeout=30)
    response = r.json()

    # An empty result list used to raise IndexError; return the full
    # response in that case, like any other unsuccessful recognition.
    if 'result' in response and response['result']:
        return response['result'][0]
    return response

def openbrowser(text):
    """Open a browser tab for the recognized text.

    If ``text`` exactly equals one of the known site keywords, that site's
    home page is opened. Any other text is sent to Baidu as a search query.

    Args:
        text: Recognized phrase, as a string.
    """
    # (keywords, url) pairs; a keyword must equal the whole text to match.
    shortcuts = (
        (('百度', 'baidu'), 'https://www.baidu.com'),
        (('腾讯', 'tengxun'), 'https://www.qq.com'),
        (('网易', 'wangyi'), 'https://www.163.com/'),
    )
    for keywords, url in shortcuts:
        if text in keywords:
            webbrowser.open_new_tab(url)
            return

    # Percent-encode the query so characters such as '&', '#', '%' or
    # spaces in the recognized text cannot truncate or corrupt the URL.
    webbrowser.open_new_tab(
        'https://www.baidu.com/s?wd=%s' % quote(text, safe=''))

def main():
    """Run the interactive record -> recognize -> open-browser loop.

    Each round asks for a language id, records audio, sends it for
    recognition, prints the result and, when the result is text, opens a
    browser tab for it. The loop continues while the user answers 'y'.
    """
    token = None
    flag = 'y'
    while flag.lower() == 'y':
        print('请输入数字选择语言：')
        devpid = input('1536：普通话(简单英文),1537:普通话(有标点),1737:英语,1637:粤语,1837:四川话\n')
        try:
            dev_pid = int(devpid)
        except ValueError:
            # Re-prompt instead of crashing on non-numeric input.
            print('输入无效，请输入数字。')
            continue

        my_record()
        # Request the token once and reuse it for later rounds instead of
        # making a token request before every recognition.
        if token is None:
            token = getToken(HOST)
        speech = get_audio(FILEPATH)
        result = speech2text(speech, token, dev_pid)
        print(result)
        # speech2text returns a str on success and the raw response
        # otherwise; only text is acted on.
        if isinstance(result, str):
            # Drop surrounding punctuation and spaces so that a result such
            # as '百度。' still matches the site keywords.
            openbrowser(result.strip('，。！？,.!? '))
        flag = input('Continue?(y/n):')


if __name__ == '__main__':
    main()

posted @ 2019-10-23 12:51 ngdty 阅读(380) 评论(0) 收藏举报

刷新页面返回顶部

ngdty

python录音

公告