131 lines
5.0 KiB
JavaScript
131 lines
5.0 KiB
JavaScript
// Plain array of words, then Python -> split, for loop, POS, and a <span> with the POS class in the HTML
|
|
|
|
|
|
// The Myth of the Natural Language %%
|
|
// Speech2Design!!
|
|
|
|
// Welcome to the core code of the speech-to-text tool
|
|
|
|
// The tool we are going to use is the "Web Speech API".
|
|
|
|
// What is an API?
|
|
// An API is a set of defined rules that explain how computers or applications communicate with one another.
|
|
// APIs sit between an application and the web server, acting as an intermediary layer that processes data transfer between systems.
|
|
|
|
|
|
|
|
// GLOBAL VARIABLES
|
|
|
|
// Recognition state shared by the handlers further down in this file.

// Interim text of the current recognition result; cleared at the start of
// every result event (the recognizer tries different words before settling
// on the most likely one).
let interimTranscripts = "";

// Accumulated markup of *all* the interim results seen so far.
let allTheInterim = "";

// Text of the results the recognizer has marked as final.
let finalTranscripts = "";

// Bridges to the HTML file.

// Element that receives the final result of the recognition.
let speech = document.getElementById("result");

// Element that receives the process: the interim results as they come in.
let process = document.getElementById("process");

// TEXT STORAGE
// localStorage keeps data in the browser with no expiration date, so the text
// saved under the "speech" key is read back and shown again on page load.
let textStorage = localStorage.getItem("speech");

speech.innerHTML = textStorage;
|
|
|
|
// RESET STORAGE
|
|
|
|
// The "reset" button wipes every result gathered so far: the in-memory
// transcripts, what is shown on the page, and the copy kept in localStorage.
let resetStorage = document.getElementById("reset");

resetStorage.addEventListener("click", () => {
  // Reset everything!!!
  allTheInterim = "";
  finalTranscripts = "";
  interimTranscripts = "";
  speech.innerHTML = "";
  // allTheInterim is only ever rendered into `process`; clear that element
  // too, otherwise the old interim results stay on screen until the next
  // recognition result overwrites them.
  process.innerHTML = "";
  textStorage = "";
  localStorage.setItem("speech", "");
});
|
|
|
|
// SAVE FILE
|
|
|
|
// The "save" button hands whatever is stored under the "speech" key to
// download(), which offers it to the user as a file named speech.txt.
let saveButton = document.getElementById("save");

saveButton.addEventListener("click", function () {
  const storedSpeech = localStorage.getItem("speech");
  download("speech.txt", storedSpeech);
});
|
|
|
|
/**
 * Offer `text` to the user as a plain-text file download.
 *
 * Builds a hidden <a> element whose href is a `data:` URI holding the
 * URI-encoded text, attaches it to the document, clicks it programmatically
 * and removes it again.
 *
 * @param {string} filename - Name suggested for the downloaded file.
 * @param {?string} text - File content; null/undefined produce an empty file.
 */
function download(filename, text) {
  // localStorage.getItem() returns null when nothing has been saved yet;
  // without this guard the file would contain the literal string "null".
  const content = text == null ? "" : String(text);

  const element = document.createElement("a");
  element.setAttribute(
    "href",
    "data:text/plain;charset=utf-8," + encodeURIComponent(content)
  );
  element.setAttribute("download", filename);

  // The link only exists to be clicked from code, so keep it invisible.
  element.style.display = "none";
  document.body.appendChild(element);

  try {
    element.click();
  } finally {
    // Always detach the temporary link, even if click() throws.
    document.body.removeChild(element);
  }
}
|
|
|
|
// START LISTENING
|
|
|
|
startConverting(); // Finally, here is where the magic happens: recognition starts as soon as the script runs (startConverting is a hoisted function declaration, so it can be called before its definition).
|
|
|
|
/**
 * Start continuous speech recognition and mirror its output into the page.
 *
 * Reads and writes the shared variables declared elsewhere in this file
 * (`interimTranscripts`, `allTheInterim`, `finalTranscripts`, `textStorage`)
 * and the `speech` / `process` elements. On every result event it:
 *   - appends final transcripts to `finalTranscripts`,
 *   - appends one <span> per interim result to `allTheInterim`, with an
 *     opacity derived from the result's confidence,
 *   - renders both into the page and stores the rendered text in
 *     localStorage under the "speech" key.
 *
 * When no recognition constructor is available, a notice is written into
 * `speech` and nothing else happens.
 */
function startConverting() {
  // Prefer the standard constructor and fall back to the webkit-prefixed one.
  // (`new A() || new B()` never reaches B: a constructed object is always truthy.)
  const Recognition = window.SpeechRecognition || window.webkitSpeechRecognition;

  if (!Recognition) {
    // Unfortunately this API works only on Chrome...
    speech.innerHTML = "At the moment this works only in Chrome, sorry";
    return;
  }

  const speechRecognizer = new Recognition();

  // Settings:
  speechRecognizer.continuous = true; // keep listening after the speaker pauses
  speechRecognizer.interimResults = true; // also deliver the interim results
  speechRecognizer.lang = "en-US"; // which language to recognize (!!)

  finalTranscripts = "";

  // Cleared when the error is one that a restart cannot fix, so that onend
  // does not spin in an endless start -> error -> end -> start loop.
  let canRestart = true;

  // ON END: log that the service stopped and start it again.
  speechRecognizer.onend = function () {
    console.log("Speech recognition service disconnected");
    if (!canRestart) {
      return;
    }
    speechRecognizer.start();
  };

  // ON SOUND START: log that audio is coming in.
  speechRecognizer.onsoundstart = function () {
    console.log("Some sound is being received");
  };

  // ON ERROR: report the error instead of silently swallowing it.
  speechRecognizer.onerror = function (event) {
    console.error("Speech recognition error:", event.error);
    if (event.error === "not-allowed" || event.error === "service-not-allowed") {
      canRestart = false;
    }
  };

  // ON RESULT: here is where the speech-to-text shows itself on the web page.
  speechRecognizer.onresult = function (event) {
    interimTranscripts = "";

    for (let i = event.resultIndex; i < event.results.length; i++) {
      const result = event.results[i];
      const best = result[0];
      // Strings are immutable: replace() returns a new string, so the result
      // has to be kept. The /g flag converts every newline, not just the first.
      const transcript = best.transcript.replace(/\n/g, "<br>");

      if (result.isFinal) {
        finalTranscripts += transcript + "\n";
      } else {
        // Interim results are shown too; the recognizer's "confidence" in the
        // result drives the opacity of its <span>.
        interimTranscripts += transcript;
        allTheInterim += `<span style="opacity: ${
          best.confidence + 0.3
        }">${interimTranscripts}</span> `;
      }
    }

    process.innerHTML = allTheInterim;

    const final =
      finalTranscripts + '<span class="interim">' + interimTranscripts + "</span>";

    speech.innerHTML = final;

    textStorage = final;
    console.log(textStorage);
    localStorage.setItem("speech", final); // keep the recognized text in localStorage
  };

  // Start only once every handler is attached.
  speechRecognizer.start();
}
|
|
|
|
|
|
// 2021, copyleft Kamo and Funix
|