Chrome Speech Synthesis with longer texts

前端 未结 12 1176
难免孤独
难免孤独 2020-11-30 19:48

I am getting a problem when trying to use Speech Synthesis API in Chrome 33. It works perfectly with a shorter text, but if I try longer text, it just stops in the middle. A

相关标签:
12条回答
  • 2020-11-30 20:06

    Yes, the google synthesis api will stop at some point during speaking a long text.

    We can see onend event, onpause and onerror event of SpeechSynthesisUtterance won't be fired normally when the sudden stop happens, so does the speechSynthesis onerror event.

    After several trials, found speechSynthesis.paused is working, and speechSynthesis.resume() can help resume the speaking.

    Hence we just need to have a timer to check the pause status during the speaking, and calling speechSynthesis.resume() to continue. The interval should be small enough to prevent glitch when continuing the speak.

    let timer = null;
    let reading = false;
    
    let readText = function(text) {
    
        if (!reading) {
            speechSynthesis.cancel();
            if (timer) {
                clearInterval(timer);
            }
            let msg = new SpeechSynthesisUtterance();
            let voices = window.speechSynthesis.getVoices();
            msg.voice = voices[82];
            msg.voiceURI = 'native';
            msg.volume = 1; // 0 to 1
            msg.rate = 1.0; // 0.1 to 10
            msg.pitch = 1; //0 to 2
            msg.text = text;
            msg.lang = 'zh-TW';
    
            msg.onerror = function(e) {
                speechSynthesis.cancel();
                reading = false;
                clearInterval(timer);
            };
    
            msg.onpause = function(e) {
                console.log('onpause in ' + e.elapsedTime + ' seconds.');
            }            
    
            msg.onend = function(e) {
                console.log('onend in ' + e.elapsedTime + ' seconds.');
                reading = false;
                clearInterval(timer);
            };
    
            speechSynthesis.onerror = function(e) {
                console.log('speechSynthesis onerror in ' + e.elapsedTime + ' seconds.');
                speechSynthesis.cancel();
                reading = false;
                clearInterval(timer);
            };
    
            speechSynthesis.speak(msg);
    
            timer = setInterval(function(){
                if (speechSynthesis.paused) {
                    console.log("#continue")
                    speechSynthesis.resume();
                }
    
            }, 100);
    
            reading = true;
    
        }
    }
    
    0 讨论(0)
  • 2020-11-30 20:10

    A simple and effective solution is to resume periodically.

    function resumeInfinity() {
        window.speechSynthesis.resume();
        timeoutResumeInfinity = setTimeout(resumeInfinity, 1000);
    }
    

    You can associate this with the onend and onstart events, so you will only be invoking the resume if necessary. Something like:

    var utterance = new SpeechSynthesisUtterance();
    
    utterance.onstart = function(event) {
        resumeInfinity();
    };
    
    utterance.onend = function(event) {
        clearTimeout(timeoutResumeInfinity);
    };
    

    I discovered this by chance!

    Hope this help!

    0 讨论(0)
  • 2020-11-30 20:16

    I have solved the probleme while having a timer function which call the pause() and resume() function and callset the timer again. On the onend event I clear the timer.

        var myTimeout;
        function myTimer() {
            window.speechSynthesis.pause();
            window.speechSynthesis.resume();
            myTimeout = setTimeout(myTimer, 10000);
        }
        ...
            window.speechSynthesis.cancel();
            myTimeout = setTimeout(myTimer, 10000);
            var toSpeak = "some text";
            var utt = new SpeechSynthesisUtterance(toSpeak);
            ...
            utt.onend =  function() { clearTimeout(myTimeout); }
            window.speechSynthesis.speak(utt);
        ...
    

    This seem to work well.

    0 讨论(0)
  • 2020-11-30 20:18

    The problem with Peter's answer is it doesn't work when you have a queue of speech synthesis set up. The script will put the new chunk at the end of the queue, and thus out of order. Example: https://jsfiddle.net/1gzkja90/

    <script type='text/javascript' src='http://code.jquery.com/jquery-2.1.0.js'></script>
    <script type='text/javascript'>    
        u = new SpeechSynthesisUtterance();
        $(document).ready(function () {
            $('.t').each(function () {
                u = new SpeechSynthesisUtterance($(this).text());
    
                speechUtteranceChunker(u, {
                    chunkLength: 120
                }, function () {
                    console.log('end');
                });
            });
        });
         /**
         * Chunkify
         * Google Chrome Speech Synthesis Chunking Pattern
         * Fixes inconsistencies with speaking long texts in speechUtterance objects 
         * Licensed under the MIT License
         *
         * Peter Woolley and Brett Zamir
         */
        var speechUtteranceChunker = function (utt, settings, callback) {
            settings = settings || {};
            var newUtt;
            var txt = (settings && settings.offset !== undefined ? utt.text.substring(settings.offset) : utt.text);
            if (utt.voice && utt.voice.voiceURI === 'native') { // Not part of the spec
                newUtt = utt;
                newUtt.text = txt;
                newUtt.addEventListener('end', function () {
                    if (speechUtteranceChunker.cancel) {
                        speechUtteranceChunker.cancel = false;
                    }
                    if (callback !== undefined) {
                        callback();
                    }
                });
            }
            else {
                var chunkLength = (settings && settings.chunkLength) || 160;
                var pattRegex = new RegExp('^[\\s\\S]{' + Math.floor(chunkLength / 2) + ',' + chunkLength + '}[.!?,]{1}|^[\\s\\S]{1,' + chunkLength + '}$|^[\\s\\S]{1,' + chunkLength + '} ');
                var chunkArr = txt.match(pattRegex);
    
                if (chunkArr[0] === undefined || chunkArr[0].length <= 2) {
                    //call once all text has been spoken...
                    if (callback !== undefined) {
                        callback();
                    }
                    return;
                }
                var chunk = chunkArr[0];
                newUtt = new SpeechSynthesisUtterance(chunk);
                var x;
                for (x in utt) {
                    if (utt.hasOwnProperty(x) && x !== 'text') {
                        newUtt[x] = utt[x];
                    }
                }
                newUtt.addEventListener('end', function () {
                    if (speechUtteranceChunker.cancel) {
                        speechUtteranceChunker.cancel = false;
                        return;
                    }
                    settings.offset = settings.offset || 0;
                    settings.offset += chunk.length - 1;
                    speechUtteranceChunker(utt, settings, callback);
                });
            }
    
            if (settings.modifier) {
                settings.modifier(newUtt);
            }
            console.log(newUtt); //IMPORTANT!! Do not remove: Logging the object out fixes some onend firing issues.
            //placing the speak invocation inside a callback fixes ordering and onend issues.
            setTimeout(function () {
                speechSynthesis.speak(newUtt);
            }, 0);
        };
    </script>
    <p class="t">MLA format follows the author-page method of in-text citation. This means that the author's last name and the page number(s) from which the quotation or paraphrase is taken must appear in the text, and a complete reference should appear on your Works Cited page. The author's name may appear either in the sentence itself or in parentheses following the quotation or paraphrase, but the page number(s) should always appear in the parentheses, not in the text of your sentence.</p>
    <p class="t">Joe waited for the train.</p>
    <p class="t">The train was late.</p>
    <p class="t">Mary and Samantha took the bus.</p>
    

    In my case, the answer was to "chunk" the string before adding them to the queue. See here: http://jsfiddle.net/vqvyjzq4/

    Many props to Peter for the idea as well as the regex (which I still have yet to conquer.) I'm sure the javascript can be cleaned up, this is more of a proof of concept.

    <script type='text/javascript' src='http://code.jquery.com/jquery-2.1.0.js'></script>
    <script type='text/javascript'>    
        var chunkLength = 120;
        var pattRegex = new RegExp('^[\\s\\S]{' + Math.floor(chunkLength / 2) + ',' + chunkLength + '}[.!?,]{1}|^[\\s\\S]{1,' + chunkLength + '}$|^[\\s\\S]{1,' + chunkLength + '} ');
    
        $(document).ready(function () {
            var element = this;
            var arr = [];
            var txt = replaceBlank($(element).text());
            while (txt.length > 0) {
                arr.push(txt.match(pattRegex)[0]);
                txt = txt.substring(arr[arr.length - 1].length);
            }
            $.each(arr, function () {
                var u = new SpeechSynthesisUtterance(this.trim());
                window.speechSynthesis.speak(u);
            });
        });
    </script>
    <p class="t">MLA format follows the author-page method of in-text citation. This means that the author's last name and the page number(s) from which the quotation or paraphrase is taken must appear in the text, and a complete reference should appear on your Works Cited page. The author's name may appear either in the sentence itself or in parentheses following the quotation or paraphrase, but the page number(s) should always appear in the parentheses, not in the text of your sentence.</p>
    <p class="t">Joe waited for the train.</p>
    <p class="t">The train was late.</p>
    <p class="t">Mary and Samantha took the bus.</p>
    
    0 讨论(0)
  • 2020-11-30 20:20

    Other suggestion do weird thing with dot or say DOT and do not respect speech intonnation on sentence end.

    var CHARACTER_LIMIT = 200;
    var lang = "en";
    
    var text = "MLA format follows the author-page method of in-text citation. This means that the author's last name and the page number(s) from which the quotation or paraphrase is taken must appear in the text, and a complete reference should appear on your Works Cited page. The author's name may appear either in the sentence itself or in parentheses following the quotation or paraphrase, but the page number(s) should always appear in the parentheses, not in the text of your sentence. Joe waited for the train. The train was late. Mary and Samantha took the bus.";
    
        speak(text, lang)
    
        function speak(text, lang) {
    
          //Support for multipart text (there is a limit on characters)
          var multipartText = [];
    
          if (text.length > CHARACTER_LIMIT) {
    
            var tmptxt = text;
    
            while (tmptxt.length > CHARACTER_LIMIT) {
    
              //Split by common phrase delimiters
              var p = tmptxt.search(/[:!?.;]+/);
              var part = '';
    
              //Coludn't split by priority characters, try commas
              if (p == -1 || p >= CHARACTER_LIMIT) {
                p = tmptxt.search(/[,]+/);
              }
    
              //Couldn't split by normal characters, then we use spaces
              if (p == -1 || p >= CHARACTER_LIMIT) {
    
                var words = tmptxt.split(' ');
    
                for (var i = 0; i < words.length; i++) {
    
                  if (part.length + words[i].length + 1 > CHARACTER_LIMIT)
                    break;
    
                  part += (i != 0 ? ' ' : '') + words[i];
    
                }
    
              } else {
    
                part = tmptxt.substr(0, p + 1);
    
              }
    
              tmptxt = tmptxt.substr(part.length, tmptxt.length - part.length);
    
              multipartText.push(part);
              //console.log(part.length + " - " + part);
    
            }
    
            //Add the remaining text
            if (tmptxt.length > 0) {
              multipartText.push(tmptxt);
            }
    
          } else {
    
            //Small text
            multipartText.push(text);
          }
    
    
          //Play multipart text
          for (var i = 0; i < multipartText.length; i++) {
    
            //Use SpeechSynthesis
            //console.log(multipartText[i]);
    
            //Create msg object
            var msg = new SpeechSynthesisUtterance();
            //msg.voice = profile.systemvoice;
            //msg.voiceURI = profile.systemvoice.voiceURI;
            msg.volume = 1; // 0 to 1
            msg.rate = 1; // 0.1 to 10
            // msg.rate = usersetting || 1; // 0.1 to 10
            msg.pitch = 1; //0 to 2*/
            msg.text = multipartText[i];
            msg.speak = multipartText;
            msg.lang = lang;
            msg.onend = self.OnFinishedPlaying;
            msg.onerror = function (e) {
              console.log('Error');
              console.log(e);
            };
            /*GC*/
            msg.onstart = function (e) {
              var curenttxt = e.currentTarget.text;
              console.log(curenttxt);
              //highlight(e.currentTarget.text);
              //$('#showtxt').text(curenttxt);
              //console.log(e);
            };
            //console.log(msg);
            speechSynthesis.speak(msg);
    
          }
    
        }
    

    https://jsfiddle.net/onigetoc/9r27Ltqz/

    0 讨论(0)
  • 2020-11-30 20:24

    I want to say that through Chrome Extensions and Applications, I solved this quite irritating issue through using chrome.tts, since chrome.tts allows you to speak through the browser, instead of the window which stops the talk when you close the window.

    Using the below code, you can fix the above issue with large speakings:

    chrome.tts.speak("Abnormally large string, over 250 characters, etc...");
    setInterval(() => { chrome.tts.resume(); }, 100);
    

    I'm sure that will work, but I did this just to be safe:

    var largeData = "";
    var smallChunks = largeData.match(/.{1,250}/g);
    for (var chunk of smallChunks) {
      chrome.tts.speak(chunk, {'enqueue': true});
    }
    

    Hope this helps someone! It helped make my application work more functionally, and epicly.

    0 讨论(0)
提交回复
热议问题