




已阅读5页,还剩7页未读, 继续免费阅读
版权说明:本文档由用户提供并上传,收益归属内容提供方,若内容存在侵权,请进行举报或认领
文档简介
基于Windows Speech SDK使用VC 6.0实现语音识别的示例程序(1)2009-02-24 13:41#include #include #include #include #include #include sphelper.h/Copyright (c) Microsoft Corporation. All rights reserved.inline HRESULT BlockForResult(ISpRecoContext * pRecoCtxt, ISpRecoResult * ppResult). HRESULT hr = S_OK; CSpEvent event;while (SUCCEEDED(hr) & SUCCEEDED(hr = event.GetFrom(pRecoCtxt) & hr = S_FALSE). hr = pRecoCtxt-WaitForNotifyEvent(INFINITE); *ppResult = event.RecoResult();if (*ppResult). (*ppResult)-AddRef(); return hr;const WCHAR * StopWord().const WCHAR * pchStop; LANGID LangId = :SpGetUserDefaultUILanguage();switch (LangId).case MAKELANGID(LANG_JAPANESE, SUBLANG_DEFAULT): pchStop = L42N860b70e50fc0ea0e70fc/05708504608a087046;break;default: pchStop = LStop;break; return pchStop;int main(int argc, char* argv). HRESULT hr = E_FAIL;bool fUseTTS = true;/ turn TTS play back on or offbool fReplay = true;/ turn Audio replay on or off/ Process optional argumentsif (argc 1).int i;for (i = 1; i argc; i+).if (_stricmp(argvi, -noTTS) = 0). fUseTTS = false;continue; if (_stricmp(argvi, -noReplay) = 0). fReplay = false;continue; printf (Usage: %s -noTTS -noReplay , argv0);return hr; 基于Windows Speech SDK使用VC 6.0实现语音识别的示例程序(2)2009-02-24 13:42if (SUCCEEDED(hr = :CoInitialize(NULL). CComPtr cpRecoCtxt; CComPtr cpGrammar; CComPtr cpVoice; hr = cpRecoCtxt.CoCreateInstance(CLSID_SpSharedRecoContext);if(SUCCEEDED(hr). hr = cpRecoCtxt-GetVoice(&cpVoice); if (cpRecoCtxt & cpVoice & SUCCEEDED(hr = cpRecoCtxt-SetNotifyWin32Event() & SUCCEEDED(hr = cpRecoCtxt-SetInterest(SPFEI(SPEI_RECOGNITION), SPFEI(SPEI_RECOGNITION) & SUCCEEDED(hr = cpRecoCtxt-SetAudioOptions(SPAO_RETAIN_AUDIO, NULL, NULL) & SUCCEEDED(hr = cpRecoCtxt-CreateGrammar(0, &cpGrammar) & SUCCEEDED(hr = cpGrammar-LoadDictation(NULL, SPLO_STATIC) & SUCCEEDED(hr = cpGrammar-SetDictationState(SPRS_ACTIVE). USES_CONVERSION;const WCHAR * const pchStop = StopWord(); CComPtr cpResult; printf( I will repeat everything you say. Say %s to exit. , W2A(pchStop) );while (SUCCEEDED(hr = BlockForResult(cpRecoCtxt, &cpResult). cpGrammar-SetDictationState( SPRS_INACTIVE ); CSpDynamicString dstrText;if (SUCCEEDED(cpResult-GetText(SP_GETWHOLEPHRASE, SP_GETWHOLEPHRASE, TRUE, &dstrText, NULL). printf(I heard: %s , W2A(dstrText);if (fUseTTS). cpVoice-Speak( LI heard, SPF_ASYNC, NULL); cpVoice-Speak( dstrText, SPF_ASYNC, NULL ); if (fReplay).if (fUseTTS) cpVoice-Speak( Lwhen you said, SPF_ASYNC, NULL);else printf ( when you said. ); cpResult-SpeakAudio(NULL, 0, NULL, NULL); cpResult.Release(); if (_wcsicmp(dstrText, pchStop) = 0).break; cpGrammar-SetDictationState( SPRS_ACTIVE ); :CoUninitialize(); return hr;VC如何编写一个语音识别的类2009-02-24 13:441)在构造语音类之前,必须先设置好工程环境: a、从微软官方网站下载windows speech sdk并安装,然后在Visual Studio 6.0中进行相关设置,在Project Setings选项的C+选项卡的“分类:预处理器”添加“,_WIN32_DCOM”(为预先初始化COM组件成功); b、将预处理头文件选项选中“自动使用预补偿页眉”; c、在常规选项卡中选择“实用MFC静态连接库”; 2)封装语音类 由于采用面向对象的编程理念,借助UML(Unified Modeling Language统一建模语言)构造CSPEECH语音类如下 CSPEECH类 + void InitSR(); /初始化语音 +void RecoEvent();/识别命令函数 +BOOL b_initSR; +BOOL b_Cmd_Grammar; /3个语音接口 +CComPtr m_cpRecocontxt; +CComPtr m_cpRecoGrammar; +CComPtr m_cpRecoEngine; 然后开始添加语音类,需要注意的是在定义语音类的头文件中,包含sphelper.h并且自定义语音识别消息和类型 #define GID_CMD_GR 333333 #define WM_RECOEVENT WM_USER+102 剩下来就是对cpp文件的函数initSR()和RecoEvent()补充函数体 3)具体见下面代码: (1)void CSpeech:initSR() HRESULT hr=S_OK; hr=m_cpRecoEngine.CoCreateInstance(CLSID_SpInprocRecognizer);/创建识别引擎COM实例 if(SUCCEEDED(hr) hr =m_cpRecoEngine-CreateRecoContext(&m_cpRecoCtxt );/创建识别上下文 else MessageBox(hWnd,error1,error,S_OK); if(SUCCEEDED(hr) hr = m_cpRecoCtxt-SetNotifyWindowMessage(hWnd, WM_RECOEVENT, 0, 0 ); /消息机制设置,使计算机时刻监听语音消息 else MessageBox(hWnd,error2,error,S_OK); if (SUCCEEDED(hr) ULONGLONG ullMyEvents = SPFEI(SPEI_RECOGNITION) | SPFEI(SPEI_HYPOTHESIS); hr = m_cpRecoCtxt-SetInterest(ullMyEvents, ullMyEvents); else MessageBox(hWnd,error3,error,S_OK); /设置默认的音频 CComPtr m_cpAudio; hr=SpCreateDefaultObjectFromCategoryId(SPCAT_AUDIOIN,&m_cpAudio);/建立默认的音频输入对象 hr=m_cpRecoEngine-SetInput(m_cpAudio,TRUE);/设置识别引擎输入源 hr=m_cpRecoCtxt-CreateGrammar(GID_CMD_GR,&m_cpCmdGrammar);/创建命令语法 b_Cmd_Grammar=TRUE; if(FAILED(hr) MessageBox(hWnd,error 4,error,S_OK); hr=m_cpCmdGrammar-LoadCmdFromResource(NULL,MAKEINTRESOURCEW(IDR_CMDCTRL),LSRGRAMMAR,MAKELANGID(LANG_NEUTRAL,SUBLANG_NEUTRAL), SPLO_DYNAMIC);/加载命令语法文件 if(FAILED(hr) MessageBox(hWnd,error5,error,S_OK); b_initSR=TRUE; (2)BOOL CSpeech:RecoEvent() USES_CONVERSION; CSpEvent event; while(event.GetFrom(m_cpRecoCtxt)=S_OK) switch(event.eEventId) case SPEI_RECOGNITION: static const WCHAR wszUnrecognized=L; CSpDynamicString dstrText; if(FAILED(event.RecoResult()-GetText(SP_GETWHOLEPHRASE,SP_GETWHOLEPHRASE,TRUE,&dstrText,NULL) dstrText=wszUnrecognized; dstrText.CopyToBSTR(&SRout); Recstring.Empty(); Recstring=SRout; if(b_Cmd_Grammar) if(Recstring=左) ISpVoice *pVoice=NULL; if(FAILED(CoInitialize(NULL) MessageBox(hWnd,Error to initialize COM,error,S_OK); return FALSE; HRESULT hr=CoCreateInstance(CLSID_SpVoice,NULL,CLSCTX_ALL,IID_ISpVoice,(void*)&pVoice); if(SUCCEEDED(hr) hr=pVoice-Speak(L左转,0,NULL); pVoice-Release(); pVoice=NULL; CoUninitialize(); m_OpenGL-m_baiscobj-LEFT=1; return TRUE ; if(Recstring=向下走) ISpVoice *pVoice=NULL; if(FAILED(CoInitialize(NULL) MessageBox(hWnd,Error to initialize COM,error,S_OK); return FALSE; HRESULT hr=CoCreateInstance(CLSID_SpVoice,NULL,CLSCTX_ALL,IID_ISpVoice,(void*)&pVoice); if(SUCCEEDED(hr) hr=pVoice-Speak(L开始后退,0,NULL); pVoice-Release(); pVoice=NULL; CoUninitialize(); m_OpenGL-m_baiscobj-BACK=1; return TRUE ; if(Recstring=最小化) ISpVoice *pVoice=NULL; if(FAILED(CoInitialize(NULL) MessageBox(hWnd,Error to initialize COM,error,S_OK); return FALSE; HRESULT hr=CoCreateInstance(CLSID_SpVoice,NULL,CLSCTX_ALL,IID_ISpVoice,(void*)&pVoice); if(SUCCEEDED(hr) hr=pVoice-Speak(L最小化,0,NULL); pVoice-Release(); pVoice=NULL; CoUninitialize(); SendMessage(hWnd,WM_SYSCOMMAND, SC_MINIMIZE, MAKELPARAM(0, 0); return TRUE; if(Recstring=右) ISpVoice *pVoice=NULL; if(FAILED(CoInitialize(NULL) MessageBox(hWnd,Error to initialize COM,error,S_OK); return FALSE; HRESULT hr=CoCreateInstance(CLSID_SpVoice,NULL,CLSCTX_ALL,IID_ISpVoice,(void*)&pVoice); if(SUCCEEDED(hr) hr=pVoice-Speak(L开始右转,0,NULL); pVoice-Release(); pVoice=NULL; CoUninitialize(); m_OpenGL-m_baiscobj-RIGHT=1; return TRUE ; if(Recstring=停下来) ISpVoice *pVoice=NULL; if(FAILED(CoInitialize(NULL) MessageBox(hWnd,Error to initialize COM,error,S_OK); return FALSE; HRESULT hr=CoCreateInstance(CLSID_SpVoice,NULL,CLSCTX_ALL,IID_ISpVoice,(void*)&pVoice); if(SUCCEEDED(hr) hr=pVoice-Speak(L动作开始了,0,NULL); pVoice-Release(); pVoice=NULL; CoUninitialize(); m_OpenGL-m_baiscobj-Move=0; m_OpenGL-m_baiscobj-BACK=0; m_OpenGL-m_baiscobj-LEFT=0; m_OpenGL-m_baiscobj-RIGHT=0; return TRUE ; if(Recstring=跑步) ISpVoice *pVoice=NULL; if(FAILED(CoInitialize(NULL) MessageBox(hWnd,Error to initialize COM,error,S_OK); return FALSE; HRESULT hr=CoCreateInstance(CLSID_SpVoice,NULL,CLSCTX_ALL,IID_ISpVoice,(void*)&pVoice); if(SUCCEEDED(hr) hr=pVoice-Speak(L动作开始了,0,NULL); pVoice-Release(); pVoice=NULL; CoUninitialize(); m_OpenGL-m_baiscobj-Move=1; return TRUE ; if(Recstring=退出) m_OpenGL-CleanUp(); / 结束处理 PostQuitMessage(0); return TRUE; return TRUE; 要注意的是RecoEvent()必须能处理人物、摄像头的漫游,所以在人物、摄像机类的行为函数中添加了控制变量Move、BACK、LEFT、RIGHT;并附了初值1,当在行为函数中为1时行为函数体执行,所以也必须 #include OpenGL.h #include baiscobj.h 其间我们借助于指针变量,巧妙的使语音能控制行为,却不影响动画的刷新,但不足的是由于opengl动画md2模型的不能导入成功,使踢球,跳木箱等功能函数没有完成,所以只要行为函数出来,可通过上述同样方法实现语音控制。 4)如何在winmain()函数中执行语音程序? 首先包含语音头文件sapi.h 接着(#define CSpeech speech)定义语音类对象 INT WINAPI WinMain(HINSTANCE hInst,HINSTANCE,LPSTR,INT )/ WinMain程序入口 :CoInitializeEx(NULL,COINIT_APARTMENTTHREADED);/初始化COM char cc=tml; WNDCLASSEX wc = sizeof(WNDCLASSEX), CS_CLASSDC, MsgProc, 0L, 0L, GetModuleHandle(NULL), NULL, NULL, NULL, (LPCTSTR)IDR_MENU1, cc, NULL ; RegisterClassEx( &wc ); m_OpenGL=new OpenGL();/ hWnd = CreateWindowEx(NULL,cc,智能精灵键盘(进退右左UP仰DOWM俯), dwStyle|WS_CLIPCHILDREN|WS_CLIPSIBLINGS,nX,nY,Width, Height,NULL,NULL,hInst,NULL); / 创建窗口 Sho
温馨提示
- 1. 本站所有资源如无特殊说明,都需要本地电脑安装OFFICE2007和PDF阅读器。图纸软件为CAD,CAXA,PROE,UG,SolidWorks等.压缩文件请下载最新的WinRAR软件解压。
- 2. 本站的文档不包含任何第三方提供的附件图纸等,如果需要附件,请联系上传者。文件的所有权益归上传用户所有。
- 3. 本站RAR压缩包中若带图纸,网页内容里面会有图纸预览,若没有图纸预览就没有图纸。
- 4. 未经权益所有人同意不得将文件中的内容挪作商业或盈利用途。
- 5. 人人文库网仅提供信息存储空间,仅对用户上传内容的表现方式做保护处理,对用户上传分享的文档内容本身不做任何修改或编辑,并不能对任何下载内容负责。
- 6. 下载文件中如有侵权或不适当内容,请与我们联系,我们立即纠正。
- 7. 本站不保证下载资源的准确性、安全性和完整性, 同时也不承担用户因使用这些下载资源对自己和他人造成任何形式的伤害或损失。
最新文档
- 2025年国内知名企业数据分析师岗位招聘面试题及答案
- 2025年人事专员面试问题及模拟题答案
- 2025年健康照护师专业资格认证考试模拟题及答案
- 2025年旋挖钻机项目建议书
- 2025年口服降血糖药项目建议书
- 2025年生物质气化机组项目建议书
- 抛光粉尘安全知识培训课件
- 抗过敏药课件
- 广西南宁市西乡塘区、江南区2024-2025学年七年级下学期期末检测地理试卷(含答案)
- 2025年电视节目自动播出设备项目建议书
- 分布式清洁能源多源互补供热研究现状分析
- 传统乐器琵琶课件
- 船舶碰撞应急预案
- 廉洁征兵培训课件
- 供应链经理上半年工作总结
- 产品功能与使用说明手册
- 开学防自然灾害 反毒品安全主题班会 课件
- 《颅骨骨折》课件
- 整体施工劳务服务方案
- DBJT13-119-2010 福建省住宅工程质量分户验收规程
- 北师大版七年级数学上册丰富的图形世界《从立体图形到平面图形》第二课时示范公开课教学课件
评论
0/150
提交评论