Python实现聊天机器人（语音录入与语音输出）

本站以下代码，Python3.6完美运行，使用工具PyCharm，系统Win10

一、思路

　　1. 功能简述

　　　　登录后进入聊天界面，如果服务器都在同一个地址，则都进入同一个房间，进入离开发消息都可以看到，输入“tuling”或“chatbot”可以切换为和Tuling机器人或者ChatBot聊天，如下图

　　　　Tuling，即图灵机器人，已经录入大量中文对话，直接调用接口即可实现自动回复，适用于开发聊天软件

　　　　ChatBot，可自行训练机器人，让机器人拥有自己的语料库，适用于企业智能聊天个性化

　　2. 需要的核心技术　　　　　　　　　　

　　　　a. 输入语音经识别后转换为输入文字

　　　　b. Tuling或ChatBot两种聊天模式获取输出文字

　　　　c. 输出文字转换为输出语音并播放　　

　　以上a和c主要调用Baidu提供的API进行转换，如果理解本文，可自行尝试调用Google提供的API实现，Google技术强大但是否对中文支持良好，博主未曾尝试，不妄自揣度

二、源码设计（贴上完整源码自己去理解）

　　　　运行顺序：TrainChat.py训练本地机器人 —— server.py开启服务器 —— client.py可运行任意多次，每次运行都可登录一个用户

　　1. 服务器server.py 主要处理用户的登录校验，房间的人员消息处理，此处通过config.py中配置的列表PORT = range(1, 3)生成两个房间（实际使用时可以配置任意多个），地址分别是127.0.0.1:1和127.0.0.1:2，启用客户端前，这个服务器要先运行

　　此中CommandHandler类拆解client客户端发送的信息中的命令，并绑定函数

 
   server.py

　　2. 训练chatbot的TrainChat.py 主要用来训练chatbot，数据保存在本地sqlite数据库（如果没有数据库自动创建），个人学习用此数据库足矣，作为企业可改为mongodb保存数据，速度会有保障

 
   TrainChat.py

　　提供了两种语料训练方法，当然选择自定义语料训练比较好，自定义语料格式，首先我们找到安装chatbot后默认提供的中文语料格式D:\Python\Lib\site-packages\chatterbot_corpus\data\chinese，打开后格式就有了，这里我们按照格式新增一个mytrain文件夹，写入自己的语料文件，如我写的phone.yml

 
   phone.yml

　　PyCharm快捷键Ctrl+Shift+F10运行TrainChat.py(如果语料有更新，再运行一次即可) ，此时我们定义的语料已经保存在本地数据库db.sqlite3（没有则自动创建）中了，接下来直接使用即可

　　3. 录音并保存文件recorder.py，提供录音功能并将录音文件保存在本地

 
   recorder.py

　　4. chatbot.py, 提供播放音频文件，调用图灵Tuling接口返回文本信息，调用chatbot返回文本信息，调用百度api语音识别，调用百度api转文本为语音(有两个百度api都可用，第一个不用密匙)，其中chatbot的数据库配置要和TrainChat.py中配置的名称一致

 
      
    
import pygame
from chatterbot import ChatBot
import requests
import json
from config import *
import time
import os
import random
import urllib.request
import base64


# Path of the most recently generated speech file. The text-to-speech helpers
# below rebind this module-level global and play_mp3() reads it.
# A raw string is used because "\P" is not a valid escape sequence; the
# resulting value is identical to the original literal.
mp3_url = r'E:\Python_Doc\voice_du\voice_ss.mp3'


# Play the MP3 file that mp3_url currently points to.
def play_mp3():
   """Play the file at the module-level ``mp3_url`` and block until it ends.

   The pygame mixer is initialised for the duration of the playback and is
   always shut down afterwards, even if loading or playing the file raises.
   """
   pygame.mixer.init()
   try:
       pygame.mixer.music.load(mp3_url)
       pygame.mixer.music.play()
       # Poll once per second until playback has finished.
       while pygame.mixer.music.get_busy():
           time.sleep(1)
       pygame.mixer.music.stop()
   finally:
       # Shut the mixer down on every path so a failed load does not leave
       # it initialised.
       pygame.mixer.quit()


# Delete the generated voice files.
def remove_voice(path=r"E:\Python_Doc\voice_du"):
   """Delete every entry directly inside ``path`` on a best-effort basis.

   Args:
       path: Directory to clean. Defaults to the folder that was previously
           hard-coded, so existing zero-argument callers behave as before.

   Entries that cannot be removed (sub-directories, files still in use, ...)
   are skipped. A missing or unreadable directory means there is nothing to
   delete and the function simply returns.
   """
   try:
       entries = os.listdir(path)
   except OSError:
       return
   for entry in entries:
       try:
           os.remove(os.path.join(path, entry))
       except OSError:
           # Best effort: skip whatever cannot be removed, but do not hide
           # unrelated errors the way a bare ``except`` would.
           continue


# Tuling auto-reply.
def tuling(info):
   """Ask the Tuling web API for a reply to ``info`` and return its text.

   Args:
       info: The message to send to the Tuling API.

   Returns:
       The value of the ``text`` field of the JSON reply.
   """
   # Let requests build the query string so that characters such as "&", "#"
   # or "+" inside the message are percent-encoded instead of corrupting the
   # URL.
   query = {"key": tuling_app_key, "info": info}
   content = requests.get(tuling_url, params=query, headers=headers)
   answer = json.loads(content.text)
   return answer['text']


# Reply produced by the locally trained ChatterBot instance.
def chatbot(info):
   """Return the ChatBot response to ``info`` as a plain string.

   A read-only bot backed by ``./db.sqlite3`` is created on each call.
   """
   bot = ChatBot("", database="./db.sqlite3", read_only=True)
   return str(bot.get_response(info))


# Baidu text-to-speech through the "tts" URL (no access token is requested).
def baidu_api(answer):
   """Convert ``answer`` to speech via ``baidu_api_url`` and save it as MP3.

   The response body is written to a randomly numbered file and the
   module-level ``mp3_url`` is rebound to that file's path.

   Args:
       answer: Text to synthesise.
   """
   global mp3_url
   # Same parameters, in the same order, as the former hand-formatted URL.
   # Passing them through ``params`` lets requests percent-encode the text,
   # so "&", "#", "+" etc. in the answer no longer break the query string.
   query = [
       ("idx", baidu_api_set["idx"]),
       ("tex", answer),
       ("cuid", baidu_api_set["cuid"]),
       ("cod", baidu_api_set["cod"]),
       ("lan", baidu_api_set["lan"]),
       ("ctp", baidu_api_set["ctp"]),
       ("pdt", baidu_api_set["pdt"]),
       ("spd", baidu_api_set["spd"]),
       ("per", baidu_api_set["per"]),
       ("vol", baidu_api_set["vol"]),
       ("pit", baidu_api_set["pit"]),
   ]
   res = requests.get(baidu_api_url, params=query, headers=headers2)
   # Local MP3 file; raw string avoids the invalid "\P" escape sequence.
   # NOTE(review): this saves into "voices" while remove_voice() cleans
   # "voice_du" - confirm that the different folder is intended.
   iname = random.randrange(1, 99999)
   mp3_url = r'E:\Python_Doc\voices\voice_tts' + str(iname) + '.mp3'
   with open(mp3_url, 'wb') as f:
       f.write(res.content)


# Baidu text-to-speech, variant 2, through the "tsn" URL (needs a token).
def baidu_api2(answer):
   """Convert ``answer`` to speech via ``baidu_api_url2`` and save it as MP3.

   A fresh access token is fetched with ``getToken()``; the audio is written
   to a randomly numbered file and the module-level ``mp3_url`` is rebound to
   that file's path.

   Args:
       answer: Text to synthesise.
   """
   # Imported here explicitly: the module only imports urllib.request and
   # relied on it pulling in urllib.parse as a side effect.
   from urllib.parse import quote

   global mp3_url
   token = getToken()
   get_url = baidu_api_url2 % (quote(answer), "test", token)
   # Context managers close the HTTP response and the file even on errors.
   with urllib.request.urlopen(get_url) as response:
       voice_data = response.read()
   # Local MP3 file; raw string avoids the invalid "\P" escape sequence.
   name = random.randrange(1, 99999)
   mp3_url = r'E:\Python_Doc\voice_du\voice_tsn' + str(name) + '.mp3'
   with open(mp3_url, 'wb') as voice_fp:
       voice_fp.write(voice_data)


# Baidu speech-to-text.
def getText(filename):
   """Send the audio file ``filename`` to Baidu and return the recognised text.

   Args:
       filename: Path of the recording to upload. The request declares it as
           16000 Hz, single-channel ``wav``.

   Returns:
       The first entry of the reply's ``result`` list when ``err_no`` is 0,
       otherwise the reply's ``err_msg``.
   """
   token = getToken()
   # Read the recording with a context manager so the handle is released.
   with open(filename, 'rb') as wav_fp:
       voice_data = wav_fp.read()
   data = {
       'format': 'wav',
       'rate': 16000,
       'channel': 1,
       'cuid': str(random.randrange(123456, 999999)),
       'token': token,
       'len': len(voice_data),
       'speech': base64.b64encode(voice_data).decode('utf-8'),
   }
   post_data = json.dumps(data)
   # Speech recognition API URL.
   upvoice_url = 'http://vop.baidu.com/server_api'
   with urllib.request.urlopen(upvoice_url, data=post_data.encode("utf-8")) as response:
       # Parse the reply once instead of re-parsing it for every field.
       reply = json.loads(response.read())
   print(reply)
   if reply['err_no'] == 0:
       return reply['result'][0]
   return reply['err_msg']


# Fetch a Baidu API access token; requested on every call because tokens expire.
def getToken():
   """Request an OAuth access token from Baidu and return it.

   Returns:
       The ``access_token`` field of the JSON reply.
   """
   # Token endpoint; the two placeholders take the API key and secret key.
   api_url = "https://openapi.baidu.com/oauth/2.0/token?" \
             "grant_type=client_credentials&client_id=%s&client_secret=%s"
   token_url = api_url % (BaiDu_API_Key_GetVoi, BaiDu_Secret_Key_GetVoi)
   # Close the HTTP response deterministically instead of leaking it.
   with urllib.request.urlopen(token_url) as response:
       token_data = json.loads(response.read())
   return token_data['access_token']
      
    

　　5. client.py,提供登录窗口，聊天窗口，以及响应事件，say按钮绑定sayDown录音和sayUp获取语音文本并发送两个事件，Users显示当前房间所有用户...

 
      
    
import wx
import telnetlib
from time import sleep
import _thread as thread
import time
import os
from chatbot import baidu_api2, chatbot, tuling, play_mp3, remove_voice, getText
from config import BOTS, BOT, default_server, VOICE_SWITCH
from recorder import recording


# Currently selected chat mode. Starts at the configured default and is rebound
# by ChatFrame.send when the user types one of the mode keywords.
bot_use = BOT


class LoginFrame(wx.Frame):
   """
   Login window: asks for a "host:port" server address and a user name.
   """
   def __init__(self, parent, id, title, size):
       # Build the widgets and wire up their event handlers.
       wx.Frame.__init__(self, parent, id, title)
       self.SetSize(size)
       self.Center()
       self.serverAddressLabel = wx.StaticText(self, label="Server Address", pos=(15, 40), size=(120, 25))
       self.userNameLabel = wx.StaticText(self, label="UserName", pos=(45, 90), size=(120, 25))
       self.serverAddress = wx.TextCtrl(self, value=default_server,
                                        pos=(120, 37), size=(150, 25), style=wx.TE_PROCESS_ENTER)
       self.userName = wx.TextCtrl(self, pos=(120, 87), size=(150, 25), style=wx.TE_PROCESS_ENTER)
       self.loginButton = wx.Button(self, label='Login', pos=(50, 145), size=(90, 30))
       self.exitButton = wx.Button(self, label='Exit', pos=(180, 145), size=(90, 30))
       # Login button -> login handler.
       self.loginButton.Bind(wx.EVT_BUTTON, self.login)
       # Exit button -> exit handler.
       self.exitButton.Bind(wx.EVT_BUTTON, self.exit)
       # Enter in the server address box moves the focus to the user name box.
       self.serverAddress.SetFocus()
       self.Bind(wx.EVT_TEXT_ENTER, self.usn_focus, self.serverAddress)
       # Enter in the user name box logs in.
       self.Bind(wx.EVT_TEXT_ENTER, self.login, self.userName)
       self.Show()

   # Move the focus to the user name input.
   def usn_focus(self, event):
       self.userName.SetFocus()

   def login(self, event):
       """Connect to the server, send the login command and open the chat window.

       Any failure is reported in a dialog. On every failure path the
       connection is closed, because each attempt opens a new one and the
       previous socket would otherwise linger until it is replaced.
       """
       try:
           serverAddress = self.serverAddress.GetLineText(0).split(':')
           con.open(serverAddress[0], port=int(serverAddress[1]), timeout=10)
           response = con.read_some()
           if response != b'Connect Success':
               con.close()
               self.showDialog('Error', 'Connect Fail!', (200, 100))
               return
           con.write(('login ' + str(self.userName.GetLineText(0)) + '\n').encode("utf-8"))
           response = con.read_some()
           if response == b'UserName Empty':
               con.close()
               self.showDialog('Error', 'UserName Empty!', (200, 100))
           elif response == b'UserName Exist':
               con.close()
               self.showDialog('Error', 'UserName Exist!', (200, 100))
           else:
               self.Close()
               ChatFrame(None, 2, title='当前用户：'+str(self.userName.GetLineText(0)), size=(515, 400))
       except Exception:
           # Covers a malformed address (no ":" or non-numeric port) as well
           # as network errors; all are reported to the user the same way.
           con.close()
           self.showDialog('Error', 'Connect Fail!', (95, 20))

   def exit(self, event):
       self.Close()

   # Show an error message dialog.
   def showDialog(self, title, content, size):
       """Show ``content`` in a modal dialog titled ``title`` of the given ``size``."""
       dialog = wx.Dialog(self, title=title, size=size)
       try:
           dialog.Center()
           wx.StaticText(dialog, label=content)
           dialog.ShowModal()
       finally:
           # Dismissing a modal dialog does not free it; destroy it explicitly
           # so repeated errors do not accumulate hidden dialogs.
           dialog.Destroy()


class ChatFrame(wx.Frame):
   """
   Chat window: shows the room's messages and sends typed or spoken input.
   """
   def __init__(self, parent, id, title, size):
       # Build the widgets and wire up their event handlers.
       wx.Frame.__init__(self, parent, id, title, style=wx.SYSTEM_MENU | wx.CAPTION | wx.CLOSE_BOX |
                                                        wx.DEFAULT_FRAME_STYLE)
       self.SetSize(size)
       self.Center()
       self.chatFrame = wx.TextCtrl(self, pos=(5, 5), size=(490, 310), style=wx.TE_MULTILINE | wx.TE_READONLY)
       self.sayButton = wx.Button(self, label="Say", pos=(5, 320), size=(58, 25))
       self.message = wx.TextCtrl(self, pos=(65, 320), size=(240, 25), style=wx.TE_PROCESS_ENTER)
       self.sendButton = wx.Button(self, label="Send", pos=(310, 320), size=(58, 25))
       self.usersButton = wx.Button(self, label="Users", pos=(373, 320), size=(58, 25))
       self.closeButton = wx.Button(self, label="Close", pos=(436, 320), size=(58, 25))
       # Send button -> send the typed message.
       self.sendButton.Bind(wx.EVT_BUTTON, self.send)
       self.message.SetFocus()
       # Say button: pressing starts recording, releasing recognises and sends.
       self.sayButton.Bind(wx.EVT_LEFT_DOWN, self.sayDown)
       self.sayButton.Bind(wx.EVT_LEFT_UP, self.sayUp)
       # Enter in the input box sends the message.
       self.Bind(wx.EVT_TEXT_ENTER, self.send, self.message)
       # Users button -> ask the server for the users in the room.
       self.usersButton.Bind(wx.EVT_BUTTON, self.lookUsers)
       # Close button -> log out and close the window.
       self.closeButton.Bind(wx.EVT_BUTTON, self.close)
       # Poll the server for incoming messages on a background thread.
       thread.start_new_thread(self.receive, ())
       # self.ShowFullScreen(True)
       self.Show()

   def sayDown(self, event):
       # Start recording on a background thread.
       thread.start_new_thread(recording, ())
       # print("ON")

   def sayUp(self, event):
       # Recognise the saved recording, put the text in the input box, send it.
       sayText = getText(r"E:\Python_Doc\voice_say\say_voice.wav")
       self.message.AppendText(str(sayText))
       self.send(event)

   def send(self, event):
       """Send the first line of the input box, then the bot's reply if any.

       The keywords "chatbot", "tuling" and "user" are not sent as chat text;
       they switch the module-level ``bot_use`` mode instead.
       """
       global bot_use
       message = str(self.message.GetLineText(0)).strip()
       if message == '':
           return
       # Mode keyword -> mode name. The name is also the prefix of the
       # "<mode>-Chat" notice sent to the server.
       modes = {"chatbot": "ChatBot", "tuling": "TuLing", "user": "User"}
       if message in modes:
           bot_use = modes[message]
           self.message.Clear()
           con.write(('noone_say You have been changed ' + bot_use + '-Chat' + '\n').encode("utf-8"))
           return
       con.write(('say ' + message + '\n').encode("utf-8"))
       self.message.Clear()
       # Bot reply.
       if bot_use == "ChatBot":
           answer = chatbot(message)
           con.write(('chatbot_say ' + answer + '\n').encode("utf-8"))
       elif bot_use == "TuLing":
           answer = tuling(message)
           con.write(('tuling_say ' + answer + '\n').encode("utf-8"))
       else:
           # "User" mode, or any unrecognised mode: there is no bot answer,
           # so nothing can be spoken (previously an unknown mode reached the
           # voice branch with ``answer`` unbound).
           return

       if VOICE_SWITCH:
           # Write the answer to a local audio file ...
           baidu_api2(answer)
           # ... and play it on a new thread.
           thread.start_new_thread(play_mp3, ())

   def lookUsers(self, event):
       # Ask the server for the users currently online.
       con.write(b'look\n')

   def close(self, event):
       # Clean up voice files, log out and close the window.
       thread.start_new_thread(remove_voice, ())
       try:
           con.write(b'logout\n')
       except OSError:
           # The connection is already gone; the window must still close.
           pass
       finally:
           con.close()
       self.Close()

   def receive(self):
       """Poll the server for incoming data and append it to the chat log.

       Runs on a background thread until the connection is closed.
       """
       import codecs

       # Decode incrementally: a multi-byte character may be split across two
       # reads. Assumes the server sends UTF-8, mirroring what this client
       # sends - TODO confirm against the server.
       decoder = codecs.getincrementaldecoder("utf-8")(errors="replace")
       while True:
           sleep(0.6)
           try:
               result = con.read_very_eager()
           except (EOFError, OSError):
               # Connection closed (e.g. by close()); stop polling.
               return
           text = decoder.decode(result)
           # The old check compared bytes with '' and was therefore always true.
           if text:
               # GUI objects must only be touched from the main thread.
               wx.CallAfter(self.chatFrame.AppendText, text)


if __name__ == '__main__':
   # Module-level telnet connection used by both windows; it is opened later
   # by LoginFrame.login.
   con = telnetlib.Telnet()
   app = wx.App()
   # Show the login window, then hand control to the wx event loop.
   LoginFrame(None, -1, title="Login", size=(320, 250))
   app.MainLoop()
      
    

　　6. config配置文件，*号内容自行去对应官网申请，本文不提供，文字转换语音并播放开关默认False，可自己修改

 
      
    
# Server address pre-filled in the login window, so it need not be retyped
# on every test run.
default_server = "127.0.0.1:1"

# Server ports; one port is one chat room.
PORT = range(1, 3)

# Available chat modes (Tuling bot, ChatBot, or plain user chat) and the default.
BOTS = ["TuLing", "ChatBot", "User"]
BOT = BOTS[2]

# Browser-like request headers.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 '
                  '(KHTML, like Gecko) Chrome/53.0.2785.143 Safari/537.36',
}
headers2 = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 '
                  '(KHTML, like Gecko)Chrome/62.0.3202.94 Safari/537.36',
}

# Tuling keys and auto-reply URL; different keys give different answers.
tuling_app_key = "******"
tuling_app_key2 = "******"
tuling_url = "http://www.tuling123.com/openapi/api"

# Switch for saving and playing the spoken answer.
VOICE_SWITCH = False

# Baidu text-to-speech: "tts" URL and its request parameters.
baidu_api_url = "http://tts.baidu.com/text2audio"
baidu_api_set = {
    "idx": 1,
    "cuid": "baidu_speech_demo",
    "cod": 2,
    "lan": "zh",
    "ctp": 1,
    "pdt": 1,
    "spd": 4,
    "per": 4,
    "vol": 5,
    "pit": 5,
}

# Baidu text-to-speech: "tsn" URL template (text, cuid, token) and credentials.
baidu_api_url2 = "http://tsn.baidu.com/text2audio?tex=%s&lan=zh&cuid=%s&ctp=1&tok=%s"
BaiDu_API_Key_GetVoi = "******"
BaiDu_Secret_Key_GetVoi = "******"

# Baidu speech recognition credentials.
BaiDu_App_ID = "******"
BaiDu_API_Key = "******"
BaiDu_Secret_Key = "******"
# Token URL template taking (client_id, client_secret). The placeholders were
# written as a bare "%", which makes "%"-formatting raise ValueError.
BaiDu_OpenApi_Url = "https://openapi.baidu.com/oauth/2.0/token" \
                    "?grant_type=client_credentials&client_id=%s&client_secret=%s"
      
    

三、总结

　　此文在语音识别之处，尚有不足，因为对百度提供的api识别没用好，不知道是说的语音质量问题，还是配置的传参问题，读者可自行研究，另博主业余爱好可能文章不足之处较多，欢迎指正！

　　转载请指明出处！

分类: Python

Python实现聊天机器人（语音录入与语音输出）

猜你喜欢