[mirotalksfu] - Merge pull request #206 from AkibHossainOmi/main

feat: Add dynamic switching between English and Bangla for voice recognition
هذا الالتزام موجود في:
Miroslav Pejic
2025-04-27 08:04:30 +02:00
ملتزم من قبل GitHub
الأصل 79ec677b86 ca9ef96cc5
التزام 2cadfd485f

عرض الملف

@@ -4,70 +4,138 @@ let isWebkitSpeechRecognitionSupported = false;
// Speech recognition instance; assigned later, once browser support is confirmed.
let recognition;
// Master switch for executing voice commands from recognized transcripts.
let isVoiceCommandsEnabled = true;
// Browser UI language; `userLanguage` is the fallback when `language` is unavailable.
let browserLanguage = navigator.language || navigator.userLanguage;
// Voice commands are offered only when the browser language tag contains 'en-' or 'bn-'.
// (Declared exactly once: a second `let` for the same name is a SyntaxError.)
let isVoiceCommandSupported = browserLanguage.includes('en-') || browserLanguage.includes('bn-');
// Key into `languageHandlers` for the command set currently in use.
let currentLanguage = 'en';
// Language code initially passed to the recognizer.
let currentLangCode = 'en-US';
// Standard constructor when present, otherwise the webkit-prefixed one (undefined if neither exists).
const speechRecognition = window.SpeechRecognition || window.webkitSpeechRecognition;
/**
* Enable real-time voice recognition in the chat, allowing you to execute commands using your voice.
* Note: Currently, only English and Bangla are supported.
* TODO: add more languages.
*/
const commands = {
shareRoom: 'room',
hideMe: 'hide me',
showMe: 'show me',
newRoom: 'new room',
leaveRoom: 'exit the room',
audioOn: 'start the audio',
audioOff: 'stop the audio',
videoOn: 'start the video',
videoOff: 'stop the video',
screenOn: 'start the screen',
screenOff: 'stop the screen',
chatOn: 'open the chat',
chatSend: 'send',
chatOff: 'close the chat',
pollOn: 'open the poll',
pollOff: 'close the poll',
editorOn: 'open the editor',
editorOff: 'close the editor',
toggleTr: 'toggle transcription',
whiteboardOn: 'open the whiteboard',
whiteboardOff: 'close the whiteboard',
snapshotRoom: 'Snapshot room',
recordingOn: 'start the recording',
recordingPause: 'pause the recording',
recordingResume: 'resume the recording',
recordingOff: 'stop the recording',
settingsOn: 'open the settings',
settingsOff: 'close the settings',
participantsOn: 'show the participants',
participantsOff: 'hide the participants',
participantsVideoOff: 'stop the participants video',
participantsAudioOff: 'stop the participants audio',
participantsKickOut: 'kick out the participants',
fileShareOn: 'open a file',
fileShareOff: 'close a file',
videoShareOn: 'share the video',
videoShareOff: 'close the video',
swapCamera: 'swap the camera',
raiseHand: 'raise the hand',
lowerHand: 'lower the hand',
roomLock: 'lock the room',
roomUnlock: 'unlock the room',
about: 'show the about',
email: 'open email',
google: 'open google',
googleTr: 'open google translate',
youtube: 'open youtube',
facebook: 'open facebook',
linkedin: 'open linkedin',
twitter: 'open twitter',
tiktok: 'open tiktok',
github: 'open github',
survey: 'open survey',
stopRecognition: 'stop the voice recognition',
/**
 * Per-language voice command tables.
 *
 * Each entry is keyed by a short language id and provides:
 *  - langCode: the language tag assigned to the speech recognizer
 *  - commands: map of command id -> spoken phrase
 *
 * Phrases are compared against `transcript.trim().toLowerCase()`, so every
 * phrase must itself be trimmed and lower case, otherwise it can never match.
 */
const languageHandlers = {
    en: {
        langCode: 'en-US',
        commands: {
            shareRoom: 'room',
            hideMe: 'hide me',
            showMe: 'show me',
            newRoom: 'new room',
            leaveRoom: 'exit the room',
            audioOn: 'start the audio',
            audioOff: 'stop the audio',
            videoOn: 'start the video',
            videoOff: 'stop the video',
            screenOn: 'start the screen',
            screenOff: 'stop the screen',
            chatOn: 'open the chat',
            chatSend: 'send',
            chatOff: 'close the chat',
            pollOn: 'open the poll',
            pollOff: 'close the poll',
            editorOn: 'open the editor',
            editorOff: 'close the editor',
            toggleTr: 'toggle transcription',
            whiteboardOn: 'open the whiteboard',
            whiteboardOff: 'close the whiteboard',
            // Was 'Snapshot room': the capital letter made it unmatchable against the lowercased transcript.
            snapshotRoom: 'snapshot room',
            recordingOn: 'start the recording',
            recordingPause: 'pause the recording',
            recordingResume: 'resume the recording',
            recordingOff: 'stop the recording',
            settingsOn: 'open the settings',
            settingsOff: 'close the settings',
            participantsOn: 'show the participants',
            participantsOff: 'hide the participants',
            participantsVideoOff: 'stop the participants video',
            participantsAudioOff: 'stop the participants audio',
            participantsKickOut: 'kick out the participants',
            fileShareOn: 'open a file',
            fileShareOff: 'close a file',
            videoShareOn: 'share the video',
            videoShareOff: 'close the video',
            swapCamera: 'swap the camera',
            raiseHand: 'raise the hand',
            lowerHand: 'lower the hand',
            roomLock: 'lock the room',
            roomUnlock: 'unlock the room',
            about: 'show the about',
            email: 'open email',
            google: 'open google',
            googleTr: 'open google translate',
            youtube: 'open youtube',
            facebook: 'open facebook',
            linkedin: 'open linkedin',
            twitter: 'open twitter',
            tiktok: 'open tiktok',
            github: 'open github',
            survey: 'open survey',
            // NOTE(review): British spelling while langCode is 'en-US'; the recognizer
            // may transcribe "recognize" — confirm this phrase actually matches.
            recognizeBangla: 'recognise bangla',
            stopRecognition: 'stop the voice recognition',
        },
    },
    bn: {
        langCode: 'bn-BD',
        commands: {
            shareRoom: 'রুম শেয়ার করো',
            hideMe: 'আমাকে লুকাও',
            showMe: 'আমাকে দেখাও',
            newRoom: 'নতুন রুম',
            leaveRoom: 'রুম থেকে বের হও',
            audioOn: 'অডিও চালু করো',
            audioOff: 'অডিও বন্ধ করো',
            videoOn: 'ভিডিও চালু করো',
            videoOff: 'ভিডিও বন্ধ করো',
            screenOn: 'স্ক্রিন চালু করো',
            screenOff: 'স্ক্রিন বন্ধ করো',
            chatOn: 'চ্যাট খুলো',
            chatSend: 'পাঠাও',
            chatOff: 'চ্যাট বন্ধ করো',
            pollOn: 'পোল খুলো',
            pollOff: 'পোল বন্ধ করো',
            editorOn: 'এডিটর খুলো',
            editorOff: 'এডিটর বন্ধ করো',
            // NOTE(review): contains '/', which a speech transcript is unlikely to include — confirm.
            toggleTr: 'ট্রান্সক্রিপশন চালু/বন্ধ করো',
            whiteboardOn: 'হোয়াইটবোর্ড খুলো',
            whiteboardOff: 'হোয়াইটবোর্ড বন্ধ করো',
            snapshotRoom: 'রুমের ছবি তুলো',
            recordingOn: 'রেকর্ডিং শুরু করো',
            recordingPause: 'রেকর্ডিং বিরতি দাও',
            recordingResume: 'রেকর্ডিং আবার শুরু করো',
            recordingOff: 'রেকর্ডিং বন্ধ করো',
            settingsOn: 'সেটিংস খুলো',
            settingsOff: 'সেটিংস বন্ধ করো',
            participantsOn: 'অংশগ্রহণকারীদের দেখাও',
            participantsOff: 'অংশগ্রহণকারীদের লুকাও',
            participantsVideoOff: 'অংশগ্রহণকারীদের ভিডিও বন্ধ করো',
            participantsAudioOff: 'অংশগ্রহণকারীদের অডিও বন্ধ করো',
            participantsKickOut: 'অংশগ্রহণকারীদের বের করে দাও',
            fileShareOn: 'ফাইল খুলো',
            fileShareOff: 'ফাইল বন্ধ করো',
            videoShareOn: 'ভিডিও শেয়ার করো',
            videoShareOff: 'ভিডিও বন্ধ করো',
            swapCamera: 'ক্যামেরা পরিবর্তন করো',
            raiseHand: 'হাত তুলো',
            lowerHand: 'হাত নামাও',
            roomLock: 'রুম লক করো',
            roomUnlock: 'রুম আনলক করো',
            about: 'সম্পর্কিত দেখাও',
            email: 'ইমেইল খুলো',
            google: 'গুগল খুলো',
            googleTr: 'গুগল অনুবাদ খুলো',
            youtube: 'ইউটিউব খুলো',
            facebook: 'ফেসবুক খুলো',
            linkedin: 'লিঙ্কডইন খুলো',
            twitter: 'টুইটার খুলো',
            tiktok: 'টিকটক খুলো',
            github: 'গিটহাব খুলো',
            survey: 'সার্ভে খুলো',
            recognizeEnglish: 'ইংরেজিতে করো',
            stopRecognition: 'ভয়েস রিকগনিশন বন্ধ করো',
        },
    },
};
const browser = {
@@ -88,7 +156,7 @@ if (speechRecognition) {
recognition.maxAlternatives = 1;
recognition.continuous = true;
recognition.lang = browserLanguage;
setRecognitionLanguage(recognition, currentLangCode);
console.log('Speech recognition', recognition);
@@ -104,7 +172,7 @@ if (speechRecognition) {
let current = e.resultIndex;
let transcript = e.results[current][0].transcript;
if (transcript) {
if (transcript.trim().toLowerCase() != commands.chatSend) {
if (transcript.trim().toLowerCase() != languageHandlers[currentLanguage].commands.chatSend) {
chatMessage.value = transcript;
}
if (isVoiceCommandsEnabled && isVoiceCommandSupported) {
@@ -132,8 +200,17 @@ if (speechRecognition) {
console.warn('This browser not supports webkitSpeechRecognition');
}
/**
 * Assign a language code to a speech recognition object.
 *
 * When `recognition` is falsy, an error is logged and nothing else happens.
 * Otherwise its `lang` property is set and the change is logged.
 *
 * @param {object} recognition - object whose `lang` property is written
 * @param {string} languageCode - language tag to assign (e.g. 'en-US')
 * @returns {void}
 */
function setRecognitionLanguage(recognition, languageCode) {
    if (recognition) {
        recognition.lang = languageCode;
        console.log(`Voice recognition language set to: ${languageCode}`);
    } else {
        console.error('Recognition object is not defined.');
    }
}
/**
 * Start speech recognition using the language code of the active command set.
 *
 * The language code comes from `languageHandlers[currentLanguage]`; if that
 * entry or its `langCode` is missing or empty, 'en-US' is used instead.
 * The earlier `recognition.lang = browserLanguage` write was removed because
 * it was always overwritten before `start()` ran.
 */
function startSpeech() {
    recognition.lang = languageHandlers[currentLanguage]?.langCode || 'en-US';
    recognition.start();
}
@@ -143,229 +220,243 @@ function stopSpeech() {
function execVoiceCommands(transcript) {
switch (transcript.trim().toLowerCase()) {
case commands.shareRoom:
printCommand(commands.shareRoom);
case languageHandlers[currentLanguage].commands.shareRoom:
printCommand(languageHandlers[currentLanguage].commands.shareRoom);
shareButton.click();
break;
case commands.hideMe:
printCommand(commands.hideMe);
case languageHandlers[currentLanguage].commands.hideMe:
printCommand(languageHandlers[currentLanguage].commands.hideMe);
hideMeButton.click();
break;
case commands.showMe:
printCommand(commands.showMe);
case languageHandlers[currentLanguage].commands.showMe:
printCommand(languageHandlers[currentLanguage].commands.showMe);
hideMeButton.click();
break;
case commands.newRoom:
printCommand(commands.newRoom);
case languageHandlers[currentLanguage].commands.newRoom:
printCommand(languageHandlers[currentLanguage].commands.newRoom);
openURL(browser.newroom);
break;
case commands.leaveRoom:
printCommand(commands.leaveRoom);
case languageHandlers[currentLanguage].commands.leaveRoom:
printCommand(languageHandlers[currentLanguage].commands.leaveRoom);
exitButton.click();
break;
case commands.audioOn:
printCommand(commands.audioOn);
case languageHandlers[currentLanguage].commands.audioOn:
printCommand(languageHandlers[currentLanguage].commands.audioOn);
startAudioButton.click();
break;
case commands.audioOff:
printCommand(commands.audioOff);
case languageHandlers[currentLanguage].commands.audioOff:
printCommand(languageHandlers[currentLanguage].commands.audioOff);
stopAudioButton.click();
break;
case commands.videoOn:
printCommand(commands.videoOn);
case languageHandlers[currentLanguage].commands.videoOn:
printCommand(languageHandlers[currentLanguage].commands.videoOn);
startVideoButton.click();
break;
case commands.videoOff:
printCommand(commands.videoOff);
case languageHandlers[currentLanguage].commands.videoOff:
printCommand(languageHandlers[currentLanguage].commands.videoOff);
stopVideoButton.click();
break;
case commands.screenOn:
printCommand(commands.screenOn);
case languageHandlers[currentLanguage].commands.screenOn:
printCommand(languageHandlers[currentLanguage].commands.screenOn);
startScreenButton.click();
break;
case commands.screenOff:
printCommand(commands.screenOff);
case languageHandlers[currentLanguage].commands.screenOff:
printCommand(languageHandlers[currentLanguage].commands.screenOff);
stopScreenButton.click();
break;
case commands.chatOn:
printCommand(commands.chatOn);
case languageHandlers[currentLanguage].commands.chatOn:
printCommand(languageHandlers[currentLanguage].commands.chatOn);
chatButton.click();
break;
case commands.pollOn:
printCommand(commands.pollOn);
case languageHandlers[currentLanguage].commands.pollOn:
printCommand(languageHandlers[currentLanguage].commands.pollOn);
pollButton.click();
break;
case commands.pollOff:
printCommand(commands.pollOff);
case languageHandlers[currentLanguage].commands.pollOff:
printCommand(languageHandlers[currentLanguage].commands.pollOff);
pollCloseBtn.click();
break;
case commands.editorOn:
printCommand(commands.editorOn);
case languageHandlers[currentLanguage].commands.editorOn:
printCommand(languageHandlers[currentLanguage].commands.editorOn);
editorButton.click();
break;
case commands.editorOff:
printCommand(commands.editorOff);
case languageHandlers[currentLanguage].commands.editorOff:
printCommand(languageHandlers[currentLanguage].commands.editorOff);
editorCloseBtn.click();
break;
case commands.chatSend:
printCommand(commands.chatSend);
case languageHandlers[currentLanguage].commands.chatSend:
printCommand(languageHandlers[currentLanguage].commands.chatSend);
chatSendButton.click();
break;
case commands.chatOff:
printCommand(commands.chatOff);
case languageHandlers[currentLanguage].commands.chatOff:
printCommand(languageHandlers[currentLanguage].commands.chatOff);
chatCloseButton.click();
break;
case commands.toggleTr:
case languageHandlers[currentLanguage].commands.toggleTr:
transcriptionButton.click();
break;
case commands.whiteboardOn:
printCommand(commands.whiteboardOn);
case languageHandlers[currentLanguage].commands.whiteboardOn:
printCommand(languageHandlers[currentLanguage].commands.whiteboardOn);
whiteboardButton.click();
break;
case commands.whiteboardOff:
printCommand(commands.whiteboardOff);
case languageHandlers[currentLanguage].commands.whiteboardOff:
printCommand(languageHandlers[currentLanguage].commands.whiteboardOff);
whiteboardCloseBtn.click();
break;
case commands.snapshotRoom:
printCommand(commands.snapshotRoom);
case languageHandlers[currentLanguage].commands.snapshotRoom:
printCommand(languageHandlers[currentLanguage].commands.snapshotRoom);
snapshotRoomButton.click();
break;
case commands.recordingOn:
printCommand(commands.recordingOn);
case languageHandlers[currentLanguage].commands.recordingOn:
printCommand(languageHandlers[currentLanguage].commands.recordingOn);
startRecButton.click();
break;
case commands.recordingPause:
printCommand(commands.recordingPause);
case languageHandlers[currentLanguage].commands.recordingPause:
printCommand(languageHandlers[currentLanguage].commands.recordingPause);
pauseRecButton.click();
break;
case commands.recordingResume:
printCommand(commands.recordingResume);
case languageHandlers[currentLanguage].commands.recordingResume:
printCommand(languageHandlers[currentLanguage].commands.recordingResume);
recordingResume.click();
break;
case commands.recordingOff:
printCommand(commands.recordingOff);
case languageHandlers[currentLanguage].commands.recordingOff:
printCommand(languageHandlers[currentLanguage].commands.recordingOff);
stopRecButton.click();
break;
case commands.settingsOn:
printCommand(commands.settingsOn);
case languageHandlers[currentLanguage].commands.settingsOn:
printCommand(languageHandlers[currentLanguage].commands.settingsOn);
settingsButton.click();
break;
case commands.settingsOff:
printCommand(commands.settingsOff);
case languageHandlers[currentLanguage].commands.settingsOff:
printCommand(languageHandlers[currentLanguage].commands.settingsOff);
mySettingsCloseBtn.click();
break;
case commands.participantsOn:
printCommand(commands.participantsOn);
case languageHandlers[currentLanguage].commands.participantsOn:
printCommand(languageHandlers[currentLanguage].commands.participantsOn);
chatButton.click();
break;
case commands.participantsOff:
printCommand(commands.participantsOff);
case languageHandlers[currentLanguage].commands.participantsOff:
printCommand(languageHandlers[currentLanguage].commands.participantsOff);
chatCloseButton.click();
break;
case commands.participantsVideoOff:
printCommand(commands.participantsVideoOff);
case languageHandlers[currentLanguage].commands.participantsVideoOff:
printCommand(languageHandlers[currentLanguage].commands.participantsVideoOff);
rc.peerAction('me', socket.id, 'hide', true, true);
break;
case commands.participantsAudioOff:
printCommand(commands.participantsAudioOff);
case languageHandlers[currentLanguage].commands.participantsAudioOff:
printCommand(languageHandlers[currentLanguage].commands.participantsAudioOff);
rc.peerAction('me', socket.id, 'mute', true, true);
break;
case commands.participantsKickOut:
printCommand(commands.participantsKickOut);
case languageHandlers[currentLanguage].commands.participantsKickOut:
printCommand(languageHandlers[currentLanguage].commands.participantsKickOut);
rc.peerAction('me', socket.id, 'eject', true, true);
break;
case commands.fileShareOn:
printCommand(commands.fileShareOn);
case languageHandlers[currentLanguage].commands.fileShareOn:
printCommand(languageHandlers[currentLanguage].commands.fileShareOn);
fileShareButton.click();
break;
case commands.fileShareOff:
printCommand(commands.fileShareOff);
case languageHandlers[currentLanguage].commands.fileShareOff:
printCommand(languageHandlers[currentLanguage].commands.fileShareOff);
sendAbortBtn.click();
break;
case commands.videoShareOn:
printCommand(commands.videoShareOn);
case languageHandlers[currentLanguage].commands.videoShareOn:
printCommand(languageHandlers[currentLanguage].commands.videoShareOn);
videoShareButton.click();
break;
case commands.videoShareOff:
printCommand(commands.videoShareOff);
case languageHandlers[currentLanguage].commands.videoShareOff:
printCommand(languageHandlers[currentLanguage].commands.videoShareOff);
videoCloseBtn.click();
break;
case commands.swapCamera:
printCommand(commands.swapCamera);
case languageHandlers[currentLanguage].commands.swapCamera:
printCommand(languageHandlers[currentLanguage].commands.swapCamera);
swapCameraButton.click();
break;
case commands.raiseHand:
printCommand(commands.raiseHand);
case languageHandlers[currentLanguage].commands.raiseHand:
printCommand(languageHandlers[currentLanguage].commands.raiseHand);
raiseHandButton.click();
break;
case commands.lowerHand:
printCommand(commands.lowerHand);
case languageHandlers[currentLanguage].commands.lowerHand:
printCommand(languageHandlers[currentLanguage].commands.lowerHand);
lowerHandButton.click();
break;
case commands.roomLock:
printCommand(commands.roomLock);
case languageHandlers[currentLanguage].commands.roomLock:
printCommand(languageHandlers[currentLanguage].commands.roomLock);
lockRoomButton.click();
break;
case commands.roomUnlock:
printCommand(commands.roomUnlock);
case languageHandlers[currentLanguage].commands.roomUnlock:
printCommand(languageHandlers[currentLanguage].commands.roomUnlock);
unlockRoomButton.click();
break;
case commands.about:
printCommand(commands.about);
case languageHandlers[currentLanguage].commands.about:
printCommand(languageHandlers[currentLanguage].commands.about);
aboutButton.click();
break;
case commands.email:
printCommand(commands.email);
case languageHandlers[currentLanguage].commands.email:
printCommand(languageHandlers[currentLanguage].commands.email);
openURL(browser.email, true);
sound('open');
break;
case commands.google:
printCommand(commands.google);
case languageHandlers[currentLanguage].commands.google:
printCommand(languageHandlers[currentLanguage].commands.google);
openURL(browser.google, true);
sound('open');
break;
case commands.googleTr:
printCommand(commands.googleTr);
case languageHandlers[currentLanguage].commands.googleTr:
printCommand(languageHandlers[currentLanguage].commands.googleTr);
openURL(browser.googleTr, true);
sound('open');
break;
case commands.youtube:
printCommand(commands.youtube);
case languageHandlers[currentLanguage].commands.youtube:
printCommand(languageHandlers[currentLanguage].commands.youtube);
openURL(browser.youtube, true);
sound('open');
break;
case commands.facebook:
printCommand(commands.facebook);
case languageHandlers[currentLanguage].commands.facebook:
printCommand(languageHandlers[currentLanguage].commands.facebook);
openURL(browser.facebook, true);
sound('open');
break;
case commands.linkedin:
printCommand(commands.linkedin);
case languageHandlers[currentLanguage].commands.linkedin:
printCommand(languageHandlers[currentLanguage].commands.linkedin);
openURL(browser.linkedin, true);
sound('open');
break;
case commands.twitter:
printCommand(commands.twitter);
case languageHandlers[currentLanguage].commands.twitter:
printCommand(languageHandlers[currentLanguage].commands.twitter);
openURL(browser.twitter, true);
sound('open');
break;
case commands.tiktok:
printCommand(commands.tiktok);
case languageHandlers[currentLanguage].commands.tiktok:
printCommand(languageHandlers[currentLanguage].commands.tiktok);
openURL(browser.tiktok, true);
sound('open');
break;
case commands.github:
printCommand(commands.github);
case languageHandlers[currentLanguage].commands.github:
printCommand(languageHandlers[currentLanguage].commands.github);
openURL(browser.github, true);
sound('open');
break;
case commands.survey:
printCommand(commands.survey);
case languageHandlers[currentLanguage].commands.survey:
printCommand(languageHandlers[currentLanguage].commands.survey);
survey.enabled && openURL(survey.url, true);
sound('open');
break;
case commands.stopRecognition:
printCommand(commands.stopRecognition);
case languageHandlers[currentLanguage].commands.recognizeBangla:
printCommand(languageHandlers[currentLanguage].commands.recognizeBangla);
currentLanguage = 'bn';
setRecognitionLanguage(recognition, languageHandlers[currentLanguage].langCode);
recognition.stop();
setTimeout(() => recognition.start(), 300);
break;
case languageHandlers[currentLanguage].commands.recognizeEnglish:
printCommand(languageHandlers[currentLanguage].commands.recognizeBangla);
currentLanguage = 'en';
setRecognitionLanguage(recognition, languageHandlers[currentLanguage].langCode);
recognition.stop();
setTimeout(() => recognition.start(), 300);
break;
case languageHandlers[currentLanguage].commands.stopRecognition:
printCommand(languageHandlers[currentLanguage].commands.stopRecognition);
chatSpeechStopButton.click();
break;
// ...