科大訊飛語(yǔ)音識(shí)別控制實(shí)際機(jī)器人運(yùn)動(dòng)。
本文將ros與語(yǔ)音識(shí)別想結(jié)合進(jìn)行開(kāi)發(fā)。進(jìn)行以下步驟,
1、創(chuàng)作ros工作空間
2、安裝mpalyer播放器
sudo apt-get install mplayer
3、將訊非的語(yǔ)音庫(kù)動(dòng)態(tài)文件.so文件放到/usr/lib/下
4、ros工程目錄src下新建文件xf_asr.cpp 并將以下內(nèi)容復(fù)制進(jìn)去,appid改成你自己的(官網(wǎng)申請(qǐng))。
/*
* 語(yǔ)音聽(tīng)寫(iFly Auto Transform)技術(shù)能夠?qū)崟r(shí)地將語(yǔ)音轉(zhuǎn)換成對(duì)應(yīng)的文字。
*/#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include "qisr.h"
#include "msp_cmn.h"
#include "msp_errors.h"
#include "speech_recognizer.h"
#include <iconv.h>#include "ros/ros.h"
#include "std_msgs/String.h"#define FRAME_LEN 640
#define BUFFER_SIZE 4096int wakeupFlag = 0 ;
int resultFlag = 0 ;static void show_result(char *string, char is_over)
{resultFlag=1; printf("\rResult: [ %s ]", string);if(is_over)putchar('\n');
}static char *g_result = NULL;static unsigned int g_buffersize = BUFFER_SIZE;void on_result(const char *result, char is_last)
{if (result) {size_t left = g_buffersize - 1 - strlen(g_result);size_t size = strlen(result);if (left < size) {g_result = (char*)realloc(g_result, g_buffersize + BUFFER_SIZE);if (g_result)g_buffersize += BUFFER_SIZE;else {printf("mem alloc failed\n");return;}}strncat(g_result, result, size);show_result(g_result, is_last);}
}void on_speech_begin()
{if (g_result){free(g_result);}g_result = (char*)malloc(BUFFER_SIZE);g_buffersize = BUFFER_SIZE;memset(g_result, 0, g_buffersize);printf("Start Listening...\n");
}
void on_speech_end(int reason)
{if (reason == END_REASON_VAD_DETECT)printf("\nSpeaking done \n");elseprintf("\nRecognizer error %d\n", reason);
}/* demo recognize the audio from microphone */
static void demo_mic(const char* session_begin_params)
{int errcode;int i = 0;struct speech_rec iat;struct speech_rec_notifier recnotifier = {on_result,on_speech_begin,on_speech_end};errcode = sr_init(&iat, session_begin_params, SR_MIC, &recnotifier);if (errcode) {printf("speech recognizer init failed\n");return;}errcode = sr_start_listening(&iat);if (errcode) {printf("start listen failed %d\n", errcode);}/* demo 10 seconds recording */while(i++ < 2)sleep(1);errcode = sr_stop_listening(&iat);if (errcode) {printf("stop listening failed %d\n", errcode);}sr_uninit(&iat);
}/* main thread: start/stop record ; query the result of recgonization.* record thread: record callback(data write)* helper thread: ui(keystroke detection)*/void WakeUp(const std_msgs::String::ConstPtr& msg)
{printf("waking up\r\n");usleep(700*1000);wakeupFlag=1;
}int main(int argc, char* argv[])
{// 初始化ROSros::init(argc, argv, "voiceRecognition");ros::NodeHandle n;ros::Rate loop_rate(10);// 聲明Publisher和Subscriber// 訂閱喚醒語(yǔ)音識(shí)別的信號(hào)ros::Subscriber wakeUpSub = n.subscribe("voiceWakeup", 1000, WakeUp); // 訂閱喚醒語(yǔ)音識(shí)別的信號(hào) ros::Publisher voiceWordsPub = n.advertise<std_msgs::String>("voiceWords", 1000); ROS_INFO("Sleeping...");int count=0;while(ros::ok()){// 語(yǔ)音識(shí)別喚醒if (wakeupFlag){ROS_INFO("Wakeup...");int ret = MSP_SUCCESS;const char* login_params = "appid = , work_dir = .";const char* session_begin_params ="sub = iat, domain = iat, language = zh_cn, ""accent = mandarin, sample_rate = 16000, ""result_type = plain, result_encoding = utf8";ret = MSPLogin(NULL, NULL, login_params);if(MSP_SUCCESS != ret){MSPLogout();printf("MSPLogin failed , Error code %d.\n",ret);}printf("Demo recognizing the speech from microphone\n");printf("Speak in 3 seconds\n");demo_mic(session_begin_params);printf("3 sec passed\n");wakeupFlag=1;MSPLogout();}// 語(yǔ)音識(shí)別完成if(resultFlag){resultFlag=0;std_msgs::String msg;msg.data = g_result;voiceWordsPub.publish(msg);}ros::spinOnce();loop_rate.sleep();count++;}exit:MSPLogout(); // Logout...return 0;
}
5、CMakeLists.txt增加以下代碼
add_executable(xf_asr src/xf_asr.cpp)
target_link_libraries(xf_asr ${catkin_LIBRARIES} -lmsc -ldl -lpthread -lm -lrt)
add_dependencies(xf_asr xf_voice_generate_messages_cpp)(這句要不要都可以)
6、回到工作空間編譯,編譯后source一下。此時(shí)語(yǔ)音識(shí)別已經(jīng)可以運(yùn)行,打開(kāi)新的終端運(yùn)行roscore。在另一個(gè)終端運(yùn)行asr。
7、添加語(yǔ)音控制的package,新創(chuàng)建一個(gè)新的package,在新的src里面創(chuàng)建voice_cmd.cpp。復(fù)制一下代碼、
#include<ros/ros.h>
#include<geometry_msgs/Twist.h>
#include<std_msgs/String.h>
#include<pthread.h>
#include<iostream>
#include<stdio.h>
//#include<string.h>
using namespace std;
ros::Publisher pub;
geometry_msgs::Twist vel_cmd;
pthread_t pth_[5];void* vel_ctr(void* arg)
{while(true){pub.publish(vel_cmd);ros::spinOnce();sleep(1);}return 0;
}
//void callback(const package_name::type_name & msg)
void callback(const std_msgs::String::ConstPtr& msg)
{cout<<"收到:"<<msg->data.c_str()<<endl;string str1 = msg->data.c_str();string str2 = "11";string str3 = "22";string str4 = "33";string str5 = "44";string str6 = "55";//if(str1 == str2)if(str1.find("前進(jìn)"))
// if(strstr(&str1, &str2)){// cout<<"11111"<<endl;vel_cmd.linear.x = 0.2;vel_cmd.angular.z = 0;pthread_create(&pth_[0],NULL,vel_ctr,NULL);}//if(str1 == str3)if(str1.find("后退“))//if(strstr(&str1 , &str3)){vel_cmd.linear.x = -0.2;vel_cmd.angular.z = 0;pthread_create(&pth_[1],NULL,vel_ctr,NULL);}if(str1.find("左轉(zhuǎn)"))//if(strstr(&str1 , &str4)){vel_cmd.linear.x = 0;vel_cmd.angular.z = 0.05;pthread_create(&pth_[2],NULL,vel_ctr,NULL);}if(str1.find("右轉(zhuǎn)"))//if(strstr(&str1 ,&str5)){vel_cmd.linear.x = 0;vel_cmd.angular.z = -0.05;pthread_create(&pth_[3],NULL,vel_ctr,NULL);}if(str1.find("停止"))//if(strstr(&str1 ,&str6)){vel_cmd.linear.x = 0;vel_cmd.angular.z = 0;pthread_create(&pth_[4],NULL,vel_ctr,NULL);}
}int main(int argc, char** argv)
{ros::init(argc, argv, "sub_word");ros::NodeHandle n;//pub = n.advertise<geometry_msgs::Twist>("/cmd_vel_mux/input/teleop",10);pub = n.advertise<geometry_msgs::Twist>("/mobile_base/mobile_base_controller/cmd_vel",1000);ros::Subscriber sub = n.subscribe("/voiceWords",10,callback);
// ros::Subscriber sub = n.subscribe("read",10,callback);//ros::Publisher pub = n.advertise<geometry_msgs::Twist>("/cmd_vel_mux/input/teleop", 10);cout<<"您好!你可以語(yǔ)音控制啦!"<<endl;
cout<<"向前行———————————>前進(jìn)"<<endl;
cout<<"向后退———————————>后退"<<endl;
cout<<"向左轉(zhuǎn)———————————>左轉(zhuǎn)"<<endl;
cout<<"向右轉(zhuǎn)———————————>右轉(zhuǎn)"<<endl;
cout<<"使停止———————————>停止"<<endl;ros::spin();
}
8、同理在Cmakelist加上以下:
add_executable(voice_cmd src/voice_cmd.cpp)
target_link_libraries(voice_cmd ${catkin_LIBRARIES} )
add_dependencies(voice_cmd voice_cmd_generate_messages_cpp)
9、回到工作空間編譯,運(yùn)行。
10、運(yùn)行上面兩個(gè)模塊后再打開(kāi)一個(gè)終端運(yùn)行rqt_graph查看節(jié)點(diǎn)圖是否聯(lián)通。(完)
或者用python去控制機(jī)器人運(yùn)動(dòng),訂閱asr的內(nèi)容,
以下是python代碼:
#!/usr/bin/env python
# This Python file uses the following encoding: utf-8
import os, sysimport roslib; roslib.load_manifest('pocketsphinx')
import rospy
import mathfrom geometry_msgs.msg import Twist
from std_msgs.msg import Stringclass voice_cmd_vel:def __init__(self):rospy.on_shutdown(self.cleanup)self.speed = 0.2self.msg = Twist()# publish to cmd_vel, subscribe to speech output#self.pub_ = rospy.Publisher('/mobile_base/commands/velocity', Twist)self.pub_ = rospy.Publisher('/mobile_base/mobile_base_controller/cmd_vel', Twist)rospy.Subscriber('/voiceWords', String, self.speechCb)r = rospy.Rate(10.0)while not rospy.is_shutdown():self.pub_.publish(self.msg)r.sleep()def speechCb(self, msg):rospy.loginfo(msg.data)#if msg.data.find("full speed") > -1:if msg.data.find("加速") > -1:if self.speed == 0.2:self.msg.linear.x = self.msg.linear.x*2self.msg.angular.z = self.msg.angular.z*2self.speed = 0.4if msg.data.find("減速") > -1:if self.speed == 0.4:self.msg.linear.x = self.msg.linear.x/2self.msg.angular.z = self.msg.angular.z/2self.speed = 0.2if msg.data.find("前進(jìn)") > -1:#if msg.data.find("forward") > -1: self.msg.linear.x = self.speedself.msg.angular.z = 0elif msg.data.find("左轉(zhuǎn)") > -1:if self.msg.linear.x != 0:if self.msg.angular.z < self.speed:self.msg.angular.z += 0.05else: self.msg.angular.z = self.speed*2elif msg.data.find("右轉(zhuǎn)") > -1: if self.msg.linear.x != 0:if self.msg.angular.z > -self.speed:self.msg.angular.z -= 0.05else: self.msg.angular.z = -self.speed*2elif msg.data.find("后退") > -1:self.msg.linear.x = -self.speedself.msg.angular.z = 0elif msg.data.find("停止") > -1 or msg.data.find("立定") > -1: self.msg = Twist()self.pub_.publish(self.msg)def cleanup(self):# stop the robot!twist = Twist()self.pub_.publish(twist)if __name__=="__main__":rospy.init_node('voice_cmd_vel')try:voice_cmd_vel()except:pass
總結(jié)
以上是生活随笔為你收集整理的ROS+科大讯飞语音识别控制机器人的全部?jī)?nèi)容,希望文章能夠幫你解決所遇到的問(wèn)題。
如果覺(jué)得生活随笔網(wǎng)站內(nèi)容還不錯(cuò),歡迎將生活随笔推薦給好友。