JunkBox_Win_Lib 1.5.3
Loading...
Searching...
No Matches
NiSpeech.cpp
Go to the documentation of this file.
1
12#include "WinBaseLib.h"
13#include "NiSpeech.h"
14
15
16
17#ifdef ENABLE_NI_SPEECH
18
19
20using namespace jbxl;
21using namespace jbxwl;
22
23
25// Face Tracker クラス
26
27CNiSpeech::CNiSpeech(IStream* stream, WAVEFORMATEX* format)
28{
29 m_pSpeechStream = NULL;
30 m_pSpeechRecognizer = NULL;
31 m_pSpeechContext = NULL;
32 m_pSpeechGrammar = NULL;
33
34 m_hSpeechEvent = NULL;
35 m_hStopEvent = NULL;
36 m_speechThread = NULL;
37
38 m_confidence = 0.1;
39
40 if (stream!=NULL && format!=NULL) init(stream, format);
41}
42
43
44
45BOOL CNiSpeech::init(IStream* stream, WAVEFORMATEX* format)
46{
47 DEBUG_INFO("CNiSpeech::init(): START\n");
48 free();
49
50 if (stream==NULL || format==NULL) return FALSE;
51
52 HRESULT hr = CoCreateInstance(CLSID_SpStream, NULL, CLSCTX_INPROC_SERVER, __uuidof(ISpStream), (void**)&m_pSpeechStream);
53 if (FAILED(hr)) {
54 DEBUG_INFO("CNiSpeech::init(): ERR 1\n");
55 return FALSE;
56 }
57
58 hr = m_pSpeechStream->SetBaseStream(stream, SPDFID_WaveFormatEx, format);
59 if (FAILED(hr)) {
60 DEBUG_INFO("CNiSpeech::init(): ERR 2\n");
61 releaseNull(m_pSpeechStream);
62 return FALSE;
63 }
64
65 DEBUG_INFO("CNiSpeech::init(): END\n");
66 return TRUE;
67}
68
69
70
71void CNiSpeech::free(void)
72{
73 DEBUG_INFO("CNiSpeech::free(): START\n");
74 releaseNull(m_pSpeechGrammar);
75 releaseNull(m_pSpeechContext);
76 releaseNull(m_pSpeechRecognizer);
77 //releaseNull(m_pSpeechStream); // sometimes crash
78 DEBUG_INFO("CNiSpeech::free(): END\n");
79}
80
81
82
83BOOL CNiSpeech::create(LPCTSTR lang)
84{
85 DEBUG_INFO("CNiSpeech::create(): START\n");
86 ISpObjectToken *pEngineToken = NULL;
87
88 releaseNull(m_pSpeechContext);
89 releaseNull(m_pSpeechRecognizer);
90
91 HRESULT hr = CoCreateInstance(CLSID_SpInprocRecognizer, NULL, CLSCTX_INPROC_SERVER, __uuidof(ISpRecognizer), (void**)&m_pSpeechRecognizer);
92 if (FAILED(hr)) {
93 DEBUG_INFO("CNiSpeech::create(): ERR 1\n");
94 return FALSE;
95 }
96
97 m_pSpeechRecognizer->SetInput(m_pSpeechStream, FALSE);
98 hr = SpFindBestToken(SPCAT_RECOGNIZERS, lang, NULL, &pEngineToken);
99
100 if (SUCCEEDED(hr)) {
101 m_pSpeechRecognizer->SetRecognizer(pEngineToken);
102 hr = m_pSpeechRecognizer->CreateRecoContext(&m_pSpeechContext);
103 releaseNull(pEngineToken);
104 }
105
106 if (FAILED(hr)) {
107 DEBUG_INFO("CNiSpeech::create(): ERR 2\n");
108 releaseNull(m_pSpeechContext);
109 releaseNull(m_pSpeechRecognizer);
110 releaseNull(m_pSpeechStream);
111 return FALSE;
112 }
113
114 DEBUG_INFO("CNiSpeech::create(): END\n");
115 return TRUE;
116}
117
118
119
120BOOL CNiSpeech::load(LPCTSTR file)
121{
122 DEBUG_INFO("CNiSpeech::load(): START\n");
123
124 if (m_pSpeechContext==NULL) {
125 DEBUG_INFO("CNiSpeech::load(): SpeechContext ERR\n");
126 return FALSE;
127 }
128
129 releaseNull(m_pSpeechGrammar);
130
131 HRESULT hr = m_pSpeechContext->CreateGrammar(1, &m_pSpeechGrammar);
132
133 if (SUCCEEDED(hr)) hr = m_pSpeechGrammar->LoadCmdFromFile(file, SPLO_STATIC);
134 if (FAILED(hr)) {
135 DEBUG_INFO("CNiSpeech::load: ERR 2\n");
136 releaseNull(m_pSpeechGrammar);
137 return FALSE;
138 }
139
140 DEBUG_INFO("CNiSpeech::load(): END\n");
141 return TRUE;
142}
143
144
145
146BOOL CNiSpeech::start(double confidence=0.1)
147{
148 if (m_pSpeechGrammar==NULL || m_pSpeechRecognizer==NULL || m_pSpeechContext==NULL) return FALSE;
149 DEBUG_INFO("CNiSpeech::start(): START\n");
150
151// stop(); // if working then stop
152
153 m_confidence = confidence;
154 //
155 m_pSpeechGrammar->SetRuleState(NULL, NULL, SPRS_ACTIVE);
156 m_pSpeechRecognizer->SetRecoState(SPRST_ACTIVE_ALWAYS);
157 DEBUG_INFO("CNiSpeech::start(): SetRecoState OK\n");
158 ::DisPatcher();
159 ::Sleep(100);
160
161 m_pSpeechContext->SetInterest(SPFEI(SPEI_RECOGNITION), SPFEI(SPEI_RECOGNITION));
162 HRESULT hr = m_pSpeechContext->Resume(0);
163 if (FAILED(hr)) {
164 DEBUG_INFO("CNiSpeech::start(): Resume ERR\n");
165 free();
166 return FALSE;
167 }
168 DEBUG_INFO("CNiSpeech::start(): Resume OK\n");
169
170 m_hStopEvent = CreateEvent(NULL, FALSE, FALSE, NULL);
171 m_hSpeechEvent = m_pSpeechContext->GetNotifyEventHandle();
172 //
173 m_speechThread = AfxBeginThread(speechThread, (LPVOID)this, THREAD_PRIORITY_NORMAL, 0, CREATE_SUSPENDED);
174 m_speechThread->m_bAutoDelete = FALSE;
175 m_speechThread->ResumeThread();
176 ::Sleep(10);
177
178 DEBUG_INFO("CNiSpeech::start(): END");
179 return TRUE;
180}
181
182
183
184void CNiSpeech::stop(void)
185{
186 DEBUG_INFO("CNiSpeech::stop(): START\n");
187
188 if (m_hStopEvent!=NULL) {
189 SetEvent(m_hStopEvent);
190 //
191 if (m_speechThread!=NULL) {
192 WaitForSingleObject(m_speechThread->m_hThread, INFINITE);
193 CloseHandle(m_speechThread->m_hThread);
194 delete m_speechThread; // as m_bAutoDelete==FALSE
195 m_speechThread = NULL;
196 //
197 //m_pSpeechContext->Pause(0);
198 DEBUG_INFO("CNiSpeech::stop(): Pause OK\n");
199 }
200 CloseHandle(m_hStopEvent);
201 m_hStopEvent = NULL;
202 }
203
204 //
205 if (m_hSpeechEvent!=NULL) {
206 CloseHandle(m_hSpeechEvent);
207 m_hSpeechEvent = NULL;
208 }
209
210 DEBUG_INFO("CNiSpeech::stop(): END\n");
211 return;
212}
213
214
215
216void CNiSpeech::process(void)
217{
218 SPEVENT curEvent;
219 ULONG fetched = 0;
220
221 m_pSpeechContext->GetEvents(1, &curEvent, &fetched);
222
223 while (fetched>0) {
224 if (curEvent.eEventId==SPEI_RECOGNITION && curEvent.elParamType==SPET_LPARAM_IS_OBJECT) {
225 //
226 ISpRecoResult* result = reinterpret_cast<ISpRecoResult*>(curEvent.lParam);
227 SPPHRASE* pPhrase = NULL;
228 result->GetPhrase(&pPhrase);
229 //
230 if (pPhrase!=NULL) {
231 if (pPhrase->pProperties!=NULL && pPhrase->pProperties->pFirstChild!=NULL) {
232 const SPPHRASEPROPERTY* pSemanticTag = pPhrase->pProperties->pFirstChild;
233 //
234 map2action(pSemanticTag->pszValue, pSemanticTag->SREngineConfidence);
235 }
236 ::CoTaskMemFree(pPhrase);
237 }
238 }
239
240 m_pSpeechContext->GetEvents(1, &curEvent, &fetched);
241 }
242
243 return;
244}
245
246
247
248void CNiSpeech::setConfidence(double confd)
249{
250 if (confd>1.0) confd = 1.0;
251 else if (confd<0.0) confd = 0.0;
252
253 m_confidence = confd;
254}
255
256
257
258
260// スレッド
261
262UINT CNiSpeech::speechThread(LPVOID pParam)
263{
264 CNiSpeech* pthis = (CNiSpeech*)pParam;
265 return pthis->speechThread();
266}
267
268
269
270UINT CNiSpeech::speechThread(void)
271{
272 DEBUG_INFO("CNiSpeech::speechThread(): START\n");
273
274 bool bContinue = true;
275
276 while(bContinue) {
277 //
278 if (WaitForSingleObject(m_hStopEvent, 0)==WAIT_OBJECT_0) {
279 bContinue = false;
280 continue;
281 }
282
283 if (WaitForSingleObject(m_hSpeechEvent, 0)==WAIT_OBJECT_0) {
284 process();
285 }
286
287 Sleep(10);
288 }
289
290 DEBUG_INFO("CNiSpeech::speechThread(): END\n");
291 return TRUE;
292}
293
294
295
296void CNiSpeech::map2action(LPCTSTR tag, double confd)
297{
298 WORD param;
299
300 if (confd>=m_confidence) {
301 param = TRUE;
302 SendWinMessage(JBXWL_WM_SPEECH_EVENT, (WPARAM)&param, (LPARAM)tag);
303 }
304 else {
305 param = FALSE;
306 SendWinMessage(JBXWL_WM_SPEECH_EVENT, (WPARAM)&param, (LPARAM)_T("N/A"));
307 }
308}
309
310
311#endif // ENABLE_NI_SPEECH
312
Speech Platform クラス ヘッダ
#define JBXWL_WM_SPEECH_EVENT
Definition WinTools.h:41
void SendWinMessage(UINT mesg, WPARAM wparam=NULL, LPARAM lparam=NULL)
Definition WinTools.cpp:561
void releaseNull(T *&ptr)
Definition WinTools.h:220