17#ifdef ENABLE_NI_SPEECH
27CNiSpeech::CNiSpeech(IStream* stream, WAVEFORMATEX* format)
29 m_pSpeechStream = NULL;
30 m_pSpeechRecognizer = NULL;
31 m_pSpeechContext = NULL;
32 m_pSpeechGrammar = NULL;
34 m_hSpeechEvent = NULL;
36 m_speechThread = NULL;
40 if (stream!=NULL && format!=NULL) init(stream, format);
45BOOL CNiSpeech::init(IStream* stream, WAVEFORMATEX* format)
47 DEBUG_INFO(
"CNiSpeech::init(): START\n");
50 if (stream==NULL || format==NULL)
return FALSE;
52 HRESULT hr = CoCreateInstance(CLSID_SpStream, NULL, CLSCTX_INPROC_SERVER, __uuidof(ISpStream), (
void**)&m_pSpeechStream);
54 DEBUG_INFO(
"CNiSpeech::init(): ERR 1\n");
58 hr = m_pSpeechStream->SetBaseStream(stream, SPDFID_WaveFormatEx, format);
60 DEBUG_INFO(
"CNiSpeech::init(): ERR 2\n");
65 DEBUG_INFO(
"CNiSpeech::init(): END\n");
71void CNiSpeech::free(
void)
73 DEBUG_INFO(
"CNiSpeech::free(): START\n");
78 DEBUG_INFO(
"CNiSpeech::free(): END\n");
83BOOL CNiSpeech::create(LPCTSTR lang)
85 DEBUG_INFO(
"CNiSpeech::create(): START\n");
86 ISpObjectToken *pEngineToken = NULL;
91 HRESULT hr = CoCreateInstance(CLSID_SpInprocRecognizer, NULL, CLSCTX_INPROC_SERVER, __uuidof(ISpRecognizer), (
void**)&m_pSpeechRecognizer);
93 DEBUG_INFO(
"CNiSpeech::create(): ERR 1\n");
97 m_pSpeechRecognizer->SetInput(m_pSpeechStream, FALSE);
98 hr = SpFindBestToken(SPCAT_RECOGNIZERS, lang, NULL, &pEngineToken);
101 m_pSpeechRecognizer->SetRecognizer(pEngineToken);
102 hr = m_pSpeechRecognizer->CreateRecoContext(&m_pSpeechContext);
107 DEBUG_INFO(
"CNiSpeech::create(): ERR 2\n");
114 DEBUG_INFO(
"CNiSpeech::create(): END\n");
120BOOL CNiSpeech::load(LPCTSTR file)
122 DEBUG_INFO(
"CNiSpeech::load(): START\n");
124 if (m_pSpeechContext==NULL) {
125 DEBUG_INFO(
"CNiSpeech::load(): SpeechContext ERR\n");
131 HRESULT hr = m_pSpeechContext->CreateGrammar(1, &m_pSpeechGrammar);
133 if (SUCCEEDED(hr)) hr = m_pSpeechGrammar->LoadCmdFromFile(file, SPLO_STATIC);
135 DEBUG_INFO(
"CNiSpeech::load: ERR 2\n");
140 DEBUG_INFO(
"CNiSpeech::load(): END\n");
146BOOL CNiSpeech::start(
double confidence=0.1)
148 if (m_pSpeechGrammar==NULL || m_pSpeechRecognizer==NULL || m_pSpeechContext==NULL)
return FALSE;
149 DEBUG_INFO(
"CNiSpeech::start(): START\n");
153 m_confidence = confidence;
155 m_pSpeechGrammar->SetRuleState(NULL, NULL, SPRS_ACTIVE);
156 m_pSpeechRecognizer->SetRecoState(SPRST_ACTIVE_ALWAYS);
157 DEBUG_INFO(
"CNiSpeech::start(): SetRecoState OK\n");
161 m_pSpeechContext->SetInterest(SPFEI(SPEI_RECOGNITION), SPFEI(SPEI_RECOGNITION));
162 HRESULT hr = m_pSpeechContext->Resume(0);
164 DEBUG_INFO(
"CNiSpeech::start(): Resume ERR\n");
168 DEBUG_INFO(
"CNiSpeech::start(): Resume OK\n");
170 m_hStopEvent = CreateEvent(NULL, FALSE, FALSE, NULL);
171 m_hSpeechEvent = m_pSpeechContext->GetNotifyEventHandle();
173 m_speechThread = AfxBeginThread(speechThread, (LPVOID)
this, THREAD_PRIORITY_NORMAL, 0, CREATE_SUSPENDED);
174 m_speechThread->m_bAutoDelete = FALSE;
175 m_speechThread->ResumeThread();
178 DEBUG_INFO(
"CNiSpeech::start(): END");
184void CNiSpeech::stop(
void)
186 DEBUG_INFO(
"CNiSpeech::stop(): START\n");
188 if (m_hStopEvent!=NULL) {
189 SetEvent(m_hStopEvent);
191 if (m_speechThread!=NULL) {
192 WaitForSingleObject(m_speechThread->m_hThread, INFINITE);
193 CloseHandle(m_speechThread->m_hThread);
194 delete m_speechThread;
195 m_speechThread = NULL;
198 DEBUG_INFO(
"CNiSpeech::stop(): Pause OK\n");
200 CloseHandle(m_hStopEvent);
205 if (m_hSpeechEvent!=NULL) {
206 CloseHandle(m_hSpeechEvent);
207 m_hSpeechEvent = NULL;
210 DEBUG_INFO(
"CNiSpeech::stop(): END\n");
216void CNiSpeech::process(
void)
221 m_pSpeechContext->GetEvents(1, &curEvent, &fetched);
224 if (curEvent.eEventId==SPEI_RECOGNITION && curEvent.elParamType==SPET_LPARAM_IS_OBJECT) {
226 ISpRecoResult* result =
reinterpret_cast<ISpRecoResult*
>(curEvent.lParam);
227 SPPHRASE* pPhrase = NULL;
228 result->GetPhrase(&pPhrase);
231 if (pPhrase->pProperties!=NULL && pPhrase->pProperties->pFirstChild!=NULL) {
232 const SPPHRASEPROPERTY* pSemanticTag = pPhrase->pProperties->pFirstChild;
234 map2action(pSemanticTag->pszValue, pSemanticTag->SREngineConfidence);
236 ::CoTaskMemFree(pPhrase);
240 m_pSpeechContext->GetEvents(1, &curEvent, &fetched);
248void CNiSpeech::setConfidence(
double confd)
250 if (confd>1.0) confd = 1.0;
251 else if (confd<0.0) confd = 0.0;
253 m_confidence = confd;
262UINT CNiSpeech::speechThread(LPVOID pParam)
264 CNiSpeech* pthis = (CNiSpeech*)pParam;
265 return pthis->speechThread();
270UINT CNiSpeech::speechThread(
void)
272 DEBUG_INFO(
"CNiSpeech::speechThread(): START\n");
274 bool bContinue =
true;
278 if (WaitForSingleObject(m_hStopEvent, 0)==WAIT_OBJECT_0) {
283 if (WaitForSingleObject(m_hSpeechEvent, 0)==WAIT_OBJECT_0) {
290 DEBUG_INFO(
"CNiSpeech::speechThread(): END\n");
296void CNiSpeech::map2action(LPCTSTR tag,
double confd)
300 if (confd>=m_confidence) {
void SendWinMessage(UINT mesg, WPARAM wparam=NULL, LPARAM lparam=NULL)
void releaseNull(T *&ptr)