In this tutorial SIGVerse user will learn how to use the Julius speech recognition service.
Use of the sharing memory between SIGVerse Service and Julius recognition
sendMsg(“VoiceReco_Service”,”Start_Recognition”)Disable service:
sendMsg(“VoiceReco_Service”,”Stop_Recognition”)
User has to use Language Model file which contains a large list of words and their probability of occurrence in a given sequence or grammar file which contains much smaller sets of predefined combinations of words. We use grammar in our service for doing command. Each word in grammar file has an associated list of phonemes (which correspond to the distinct sounds that makes a word). Acoustic model is associated to grammar it contain a statistical representation of each sound that makes each word. Each sound corresponds to a phoneme. Recognition grammar is separated into two files:
• the ".grammar" file which defines a set of rules governing the words the SRE is expected to recognize; rather than listing out each word in the .grammar file, a Julian grammar file uses "Word Categories" - which is the name for a list of words to be recognized (which are defined in a separate ".voca" file);
• the ".voca" file which defines the actual "Word Candidates" in each Word Category and their pronunciation information (Note: the phonemes that make up this pronunciation information must be the same as will be used to train your Acoustic Model).
Compiling grammar : The .grammar and .voca files need to be compiled into ".dfa" and ".dict" files so that Julius can use them. This is done using "mkdfa.pl" grammar compiler. The .grammar and .voca files need to have the same file prefix, and this prefix is then specified to the mkdfa.pl script.
PATH-TO-EXECUTABLE/mkdfa.pl .\grammar\simple
This will generate the expected grammar
#include <sphelper.h> #include <string> #include <iostream> #include "SIGService.h" #include <windows.h> #include <tchar.h> #include <conio.h> #include "app.h" //includes for Shared memory #include <windows.h> #include <stdio.h> #include <conio.h> #include <tchar.h> #pragma comment(lib, "user32.lib")
#define BUF_SIZE 256 TCHAR szName[]=TEXT("Global\\MyFileMappingObject"); LPCTSTR pBuf; HANDLE hMapFile; bool Enable; std::string send_msg_for;
class VoiceRecognition : public sigverse::SIGService { public: VoiceRecognition(std::string name) : SIGService(name){}; ~VoiceRecognition(); double onAction(); void onRecvMsg(sigverse::RecvMsgEvent &evt); void onInit (); };
VoiceRecognition::~VoiceRecognition() { this->disconnect(); }
void VoiceRecognition::onInit (){ //system("start"); Enable = true; system("start .\\julius.exe -input mic -C .\\SIGVerseGrammar/Sample.jconf"); std::string send_msg_for = ""; sleep(2000); }
double VoiceRecognition::onAction() { char* kk = ""; /////// shared memory ////// if (Enable) { hMapFile = CreateFileMapping( INVALID_HANDLE_VALUE, // use paging file NULL, // default security PAGE_READWRITE, // read/write access 0, // maximum object size (high-order DWORD) BUF_SIZE, // maximum object size (low-order DWORD) szName); // name of mapping object if (hMapFile == NULL) { _tprintf(TEXT("Could not create file mapping object (%d).\n"), GetLastError()); return 1; } pBuf = (LPTSTR) MapViewOfFile(hMapFile, // handle to map object FILE_MAP_ALL_ACCESS, // read/write permission 0, 0, BUF_SIZE); if (pBuf == NULL) { _tprintf(TEXT("Could not map view of file (%d).\n"), GetLastError()); CloseHandle(hMapFile); return 0.1; } std::string send_msg ="VOICE_DATA " + (std::string) pBuf; //strcat((char*) send_msg.c_str(),"VOICE_DATA "); //strcat(kk,"VOICE_DATA "); //strcat(kk,(char*)send_msg.c_str()); //std::string send_msgs; //strcpy((char*)send_msgs.c_str(),kk); //if(strcmp(send_msg.c_str(),send_msg_for.c_str())==1) // { this->sendMsg("man_000",(char*) send_msg.c_str()); //this->sendMsg("man_000",kk); printf ("%s \n", (char*) send_msg.c_str() ); // printf ("%s \n", kk ); // } send_msg_for = send_msg; UnmapViewOfFile(pBuf); pBuf = _T(""); CloseHandle(hMapFile); // printf("close the file mapping \n"); } return 0.1; }
void VoiceRecognition::onRecvMsg(sigverse::RecvMsgEvent &evt) { std::string sender = evt.getSender(); std::string msg = evt.getMsg(); std::string s = msg; printf("Message : %s \n",s.c_str()); std::wstring ws; printf("Sender : %s \n", sender.c_str()); if (strcmp(s.c_str(),"Stop_Reco")==0) { Enable = false; } else if(strcmp(s.c_str(),"Start_Reco")==0) { Enable = true; } }
int main(int argc, char** argv) { VoiceRecognition srv("VoiceReco_Service"); srv.onInit(); unsigned short port = (unsigned short)(atoi(argv[2])); srv.connect(argv[1], port); //srv.connect("192.168.40.195", 9000); srv.startLoop(); return 0; }