日韩性视频-久久久蜜桃-www中文字幕-在线中文字幕av-亚洲欧美一区二区三区四区-撸久久-香蕉视频一区-久久无码精品丰满人妻-国产高潮av-激情福利社-日韩av网址大全-国产精品久久999-日本五十路在线-性欧美在线-久久99精品波多结衣一区-男女午夜免费视频-黑人极品ⅴideos精品欧美棵-人人妻人人澡人人爽精品欧美一区-日韩一区在线看-欧美a级在线免费观看

歡迎訪問 生活随笔!

生活随笔

當前位置: 首頁 > 编程资源 > 编程问答 >内容正文

编程问答

ROS+科大讯飞语音识别控制机器人

發(fā)布時間:2024/3/26 编程问答 52 豆豆
生活随笔 收集整理的這篇文章主要介紹了 ROS+科大讯飞语音识别控制机器人 小編覺得挺不錯的,現在分享給大家,幫大家做個參考.

科大訊飛語音識別控制實際機器人運動。

本文將ros與語音識別想結合進行開發(fā)。進行以下步驟,
1、創(chuàng)作ros工作空間
2、安裝mpalyer播放器

sudo apt-get install mplayer

3、將訊非的語音庫動態(tài)文件.so文件放到/usr/lib/下
4、ros工程目錄src下新建文件xf_asr.cpp 并將以下內容復制進去,appid改成你自己的(官網申請)。

/* * 語音聽寫(iFly Auto Transform)技術能夠實時地將語音轉換成對應的文字。 */#include <stdlib.h> #include <stdio.h> #include <string.h> #include <unistd.h> #include "qisr.h" #include "msp_cmn.h" #include "msp_errors.h" #include "speech_recognizer.h" #include <iconv.h>#include "ros/ros.h" #include "std_msgs/String.h"#define FRAME_LEN 640 #define BUFFER_SIZE 4096int wakeupFlag = 0 ; int resultFlag = 0 ;static void show_result(char *string, char is_over) {resultFlag=1; printf("\rResult: [ %s ]", string);if(is_over)putchar('\n'); }static char *g_result = NULL;static unsigned int g_buffersize = BUFFER_SIZE;void on_result(const char *result, char is_last) {if (result) {size_t left = g_buffersize - 1 - strlen(g_result);size_t size = strlen(result);if (left < size) {g_result = (char*)realloc(g_result, g_buffersize + BUFFER_SIZE);if (g_result)g_buffersize += BUFFER_SIZE;else {printf("mem alloc failed\n");return;}}strncat(g_result, result, size);show_result(g_result, is_last);} }void on_speech_begin() {if (g_result){free(g_result);}g_result = (char*)malloc(BUFFER_SIZE);g_buffersize = BUFFER_SIZE;memset(g_result, 0, g_buffersize);printf("Start Listening...\n"); } void on_speech_end(int reason) {if (reason == END_REASON_VAD_DETECT)printf("\nSpeaking done \n");elseprintf("\nRecognizer error %d\n", reason); }/* demo recognize the audio from microphone */ static void demo_mic(const char* session_begin_params) {int errcode;int i = 0;struct speech_rec iat;struct speech_rec_notifier recnotifier = {on_result,on_speech_begin,on_speech_end};errcode = sr_init(&iat, session_begin_params, SR_MIC, &recnotifier);if (errcode) {printf("speech recognizer init failed\n");return;}errcode = sr_start_listening(&iat);if (errcode) {printf("start listen failed %d\n", errcode);}/* demo 10 seconds recording */while(i++ < 2)sleep(1);errcode = sr_stop_listening(&iat);if (errcode) {printf("stop listening failed %d\n", errcode);}sr_uninit(&iat); }/* main thread: start/stop record ; query the result of recgonization.* record thread: record callback(data write)* helper thread: ui(keystroke detection)*/void WakeUp(const std_msgs::String::ConstPtr& msg) {printf("waking up\r\n");usleep(700*1000);wakeupFlag=1; }int main(int argc, char* argv[]) {// 初始化ROSros::init(argc, argv, "voiceRecognition");ros::NodeHandle n;ros::Rate loop_rate(10);// 聲明Publisher和Subscriber// 訂閱喚醒語音識別的信號ros::Subscriber wakeUpSub = n.subscribe("voiceWakeup", 1000, WakeUp); // 訂閱喚醒語音識別的信號 ros::Publisher voiceWordsPub = n.advertise<std_msgs::String>("voiceWords", 1000); ROS_INFO("Sleeping...");int count=0;while(ros::ok()){// 語音識別喚醒if (wakeupFlag){ROS_INFO("Wakeup...");int ret = MSP_SUCCESS;const char* login_params = "appid = , work_dir = .";const char* session_begin_params ="sub = iat, domain = iat, language = zh_cn, ""accent = mandarin, sample_rate = 16000, ""result_type = plain, result_encoding = utf8";ret = MSPLogin(NULL, NULL, login_params);if(MSP_SUCCESS != ret){MSPLogout();printf("MSPLogin failed , Error code %d.\n",ret);}printf("Demo recognizing the speech from microphone\n");printf("Speak in 3 seconds\n");demo_mic(session_begin_params);printf("3 sec passed\n");wakeupFlag=1;MSPLogout();}// 語音識別完成if(resultFlag){resultFlag=0;std_msgs::String msg;msg.data = g_result;voiceWordsPub.publish(msg);}ros::spinOnce();loop_rate.sleep();count++;}exit:MSPLogout(); // Logout...return 0; }

5、CMakeLists.txt增加以下代碼

add_executable(xf_asr src/xf_asr.cpp) target_link_libraries(xf_asr ${catkin_LIBRARIES} -lmsc -ldl -lpthread -lm -lrt) add_dependencies(xf_asr xf_voice_generate_messages_cpp)(這句要不要都可以)

6、回到工作空間編譯,編譯后source一下。此時語音識別已經可以運行,打開新的終端運行roscore。在另一個終端運行asr。
7、添加語音控制的package,新創(chuàng)建一個新的package,在新的src里面創(chuàng)建voice_cmd.cpp。復制一下代碼、

#include<ros/ros.h> #include<geometry_msgs/Twist.h> #include<std_msgs/String.h> #include<pthread.h> #include<iostream> #include<stdio.h> //#include<string.h> using namespace std; ros::Publisher pub; geometry_msgs::Twist vel_cmd; pthread_t pth_[5];void* vel_ctr(void* arg) {while(true){pub.publish(vel_cmd);ros::spinOnce();sleep(1);}return 0; } //void callback(const package_name::type_name & msg) void callback(const std_msgs::String::ConstPtr& msg) {cout<<"收到:"<<msg->data.c_str()<<endl;string str1 = msg->data.c_str();string str2 = "11";string str3 = "22";string str4 = "33";string str5 = "44";string str6 = "55";//if(str1 == str2)if(str1.find("前進")) // if(strstr(&str1, &str2)){// cout<<"11111"<<endl;vel_cmd.linear.x = 0.2;vel_cmd.angular.z = 0;pthread_create(&pth_[0],NULL,vel_ctr,NULL);}//if(str1 == str3)if(str1.find("后退“))//if(strstr(&str1 , &str3)){vel_cmd.linear.x = -0.2;vel_cmd.angular.z = 0;pthread_create(&pth_[1],NULL,vel_ctr,NULL);}if(str1.find("左轉"))//if(strstr(&str1 , &str4)){vel_cmd.linear.x = 0;vel_cmd.angular.z = 0.05;pthread_create(&pth_[2],NULL,vel_ctr,NULL);}if(str1.find("右轉"))//if(strstr(&str1 ,&str5)){vel_cmd.linear.x = 0;vel_cmd.angular.z = -0.05;pthread_create(&pth_[3],NULL,vel_ctr,NULL);}if(str1.find("停止"))//if(strstr(&str1 ,&str6)){vel_cmd.linear.x = 0;vel_cmd.angular.z = 0;pthread_create(&pth_[4],NULL,vel_ctr,NULL);} }int main(int argc, char** argv) {ros::init(argc, argv, "sub_word");ros::NodeHandle n;//pub = n.advertise<geometry_msgs::Twist>("/cmd_vel_mux/input/teleop",10);pub = n.advertise<geometry_msgs::Twist>("/mobile_base/mobile_base_controller/cmd_vel",1000);ros::Subscriber sub = n.subscribe("/voiceWords",10,callback); // ros::Subscriber sub = n.subscribe("read",10,callback);//ros::Publisher pub = n.advertise<geometry_msgs::Twist>("/cmd_vel_mux/input/teleop", 10);cout<<"您好!你可以語音控制啦!"<<endl; cout<<"向前行———————————>前進"<<endl; cout<<"向后退———————————>后退"<<endl; cout<<"向左轉———————————>左轉"<<endl; cout<<"向右轉———————————>右轉"<<endl; cout<<"使停止———————————>停止"<<endl;ros::spin(); }

8、同理在Cmakelist加上以下:

add_executable(voice_cmd src/voice_cmd.cpp) target_link_libraries(voice_cmd ${catkin_LIBRARIES} ) add_dependencies(voice_cmd voice_cmd_generate_messages_cpp)

9、回到工作空間編譯,運行。
10、運行上面兩個模塊后再打開一個終端運行rqt_graph查看節(jié)點圖是否聯通。(完)

或者用python去控制機器人運動,訂閱asr的內容,
以下是python代碼:

#!/usr/bin/env python # This Python file uses the following encoding: utf-8 import os, sysimport roslib; roslib.load_manifest('pocketsphinx') import rospy import mathfrom geometry_msgs.msg import Twist from std_msgs.msg import Stringclass voice_cmd_vel:def __init__(self):rospy.on_shutdown(self.cleanup)self.speed = 0.2self.msg = Twist()# publish to cmd_vel, subscribe to speech output#self.pub_ = rospy.Publisher('/mobile_base/commands/velocity', Twist)self.pub_ = rospy.Publisher('/mobile_base/mobile_base_controller/cmd_vel', Twist)rospy.Subscriber('/voiceWords', String, self.speechCb)r = rospy.Rate(10.0)while not rospy.is_shutdown():self.pub_.publish(self.msg)r.sleep()def speechCb(self, msg):rospy.loginfo(msg.data)#if msg.data.find("full speed") > -1:if msg.data.find("加速") > -1:if self.speed == 0.2:self.msg.linear.x = self.msg.linear.x*2self.msg.angular.z = self.msg.angular.z*2self.speed = 0.4if msg.data.find("減速") > -1:if self.speed == 0.4:self.msg.linear.x = self.msg.linear.x/2self.msg.angular.z = self.msg.angular.z/2self.speed = 0.2if msg.data.find("前進") > -1:#if msg.data.find("forward") > -1: self.msg.linear.x = self.speedself.msg.angular.z = 0elif msg.data.find("左轉") > -1:if self.msg.linear.x != 0:if self.msg.angular.z < self.speed:self.msg.angular.z += 0.05else: self.msg.angular.z = self.speed*2elif msg.data.find("右轉") > -1: if self.msg.linear.x != 0:if self.msg.angular.z > -self.speed:self.msg.angular.z -= 0.05else: self.msg.angular.z = -self.speed*2elif msg.data.find("后退") > -1:self.msg.linear.x = -self.speedself.msg.angular.z = 0elif msg.data.find("停止") > -1 or msg.data.find("立定") > -1: self.msg = Twist()self.pub_.publish(self.msg)def cleanup(self):# stop the robot!twist = Twist()self.pub_.publish(twist)if __name__=="__main__":rospy.init_node('voice_cmd_vel')try:voice_cmd_vel()except:pass

總結

以上是生活随笔為你收集整理的ROS+科大讯飞语音识别控制机器人的全部內容,希望文章能夠幫你解決所遇到的問題。

如果覺得生活随笔網站內容還不錯,歡迎將生活随笔推薦給好友。