Skip to content

Commit cc3e7fe

Browse files
committed
javascript synthesizer events etc
1 parent 9c65935 commit cc3e7fe

File tree

3 files changed

+96
-8
lines changed

3 files changed

+96
-8
lines changed

articles/cognitive-services/Speech-Service/includes/how-to/speech-synthesis/cpp.md

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -100,7 +100,7 @@ This time, save the result to a [`SpeechSynthesisResult`](/cpp/cognitive-service
100100
void synthesizeSpeech()
101101
{
102102
auto speechConfig = SpeechConfig::FromSubscription("YourSpeechKey", "YourSpeechRegion");
103-
auto synthesizer = SpeechSynthesizer::FromConfig(speechConfig, NULL);
103+
auto synthesizer = SpeechSynthesizer::FromConfig(speechConfig);
104104

105105
auto result = synthesizer->SpeakTextAsync("Getting the response as an in-memory stream.").get();
106106
auto stream = AudioDataStream::FromResult(result);
@@ -132,7 +132,7 @@ void synthesizeSpeech()
132132
auto speechConfig = SpeechConfig::FromSubscription("YourSpeechKey", "YourSpeechRegion");
133133
speechConfig->SetSpeechSynthesisOutputFormat(SpeechSynthesisOutputFormat::Riff24Khz16BitMonoPcm);
134134

135-
auto synthesizer = SpeechSynthesizer::FromConfig(speechConfig, NULL);
135+
auto synthesizer = SpeechSynthesizer::FromConfig(speechConfig);
136136
auto result = synthesizer->SpeakTextAsync("A simple test to write to a file.").get();
137137

138138
auto stream = AudioDataStream::FromResult(result);
@@ -164,7 +164,7 @@ Next, you need to change the speech synthesis request to reference your XML file
164164
void synthesizeSpeech()
165165
{
166166
auto speechConfig = SpeechConfig::FromSubscription("YourSpeechKey", "YourSpeechRegion");
167-
auto synthesizer = SpeechSynthesizer::FromConfig(speechConfig, NULL);
167+
auto synthesizer = SpeechSynthesizer::FromConfig(speechConfig);
168168

169169
std::ifstream file("./ssml.xml");
170170
std::string ssml, line;

articles/cognitive-services/Speech-Service/includes/how-to/speech-synthesis/csharp.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -212,7 +212,7 @@ class Program
212212
</speak>";
213213

214214
// Required for sentence-level WordBoundary events
215-
speechConfig.SetProperty("SpeechServiceResponse_RequestSentenceBoundary", "true");
215+
speechConfig.SetProperty(PropertyId.SpeechServiceResponse_RequestSentenceBoundary, "true");
216216

217217
using (var speechSynthesizer = new SpeechSynthesizer(speechConfig))
218218
{

articles/cognitive-services/Speech-Service/includes/how-to/speech-synthesis/javascript.md

Lines changed: 92 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -341,12 +341,100 @@ While using the [SpeechSynthesizer](/javascript/api/microsoft-cognitiveservices-
341341

342342
[!INCLUDE [Event types](events.md)]
343343

344-
Here's an example that shows how to subscribe to the `bookmarkReached` event for speech synthesis.
344+
Here's an example that shows how to subscribe to events for speech synthesis. You can follow the instructions in the [quickstart](../../../get-started-text-to-speech.md?pivots=javascript), but replace the contents of that `SpeechSynthesis.js` file with the following JavaScript code.
345345

346346
```javascript
347-
synthesizer.bookmarkReached = function (s, e) {
348-
window.console.log("(Bookmark reached), Audio offset: " + e.audioOffset / 10000 + "ms, bookmark text: " + e.text);
349-
}
347+
(function() {
348+
349+
"use strict";
350+
351+
var sdk = require("microsoft-cognitiveservices-speech-sdk");
352+
353+
var audioFile = "YourAudioFile.wav";
354+
const speechConfig = sdk.SpeechConfig.fromSubscription(process.env.SPEECH_KEY, process.env.SPEECH_REGION);
355+
const audioConfig = sdk.AudioConfig.fromAudioFileOutput(audioFile);
356+
357+
var speechSynthesisVoiceName = "en-US-JennyNeural";
358+
var ssml = `<speak version='1.0' xml:lang='en-US' xmlns='http://www.w3.org/2001/10/synthesis' xmlns:mstts='http://www.w3.org/2001/mstts'> \r\n \
359+
<voice name='${speechSynthesisVoiceName}'> \r\n \
360+
<mstts:viseme type='redlips_front'/> \r\n \
361+
The rainbow has seven colors: <bookmark mark='colors_list_begin'/>Red, orange, yellow, green, blue, indigo, and violet.<bookmark mark='colors_list_end'/>. \r\n \
362+
</voice> \r\n \
363+
</speak>`;
364+
365+
// Required for sentence-level WordBoundary events.
366+
speechConfig.setProperty(sdk.PropertyId.SpeechServiceResponse_RequestSentenceBoundary, "true");
367+
368+
// Create the speech synthesizer.
369+
var speechSynthesizer = new sdk.SpeechSynthesizer(speechConfig, audioConfig);
370+
371+
speechSynthesizer.bookmarkReached = function (s, e) {
372+
var str = `BookmarkReached event: \
373+
\r\n\tAudioOffset: ${(e.audioOffset + 5000) / 10000}ms \
374+
\r\n\tText: \"${e.text}\".`;
375+
console.log(str);
376+
}
377+
378+
speechSynthesizer.synthesisCanceled = function (s, e) {
379+
console.log("SynthesisCanceled event");
380+
};
381+
382+
speechSynthesizer.synthesisCompleted = function (s, e) {
383+
var str = `SynthesisCompleted event: \
384+
\r\n\tAudioData: ${e.result.audioData.byteLength} bytes \
385+
\r\n\tAudioDuration: ${e.result.audioDuration}`;
386+
console.log(str);
387+
};
388+
389+
speechSynthesizer.synthesisStarted = function (s, e) {
390+
console.log("SynthesisStarted event");
391+
};
392+
393+
speechSynthesizer.synthesizing = function (s, e) {
394+
var str = `Synthesizing event: \
395+
\r\n\tAudioData: ${e.result.audioData.byteLength} bytes`;
396+
console.log(str);
397+
};
398+
399+
speechSynthesizer.visemeReceived = function(s, e) {
400+
var str = `VisemeReceived event: \
401+
\r\n\tAudioOffset: ${(e.audioOffset + 5000) / 10000}ms \
402+
\r\n\tVisemeId: ${e.visemeId}`;
403+
console.log(str);
404+
}
405+
406+
speechSynthesizer.wordBoundary = function (s, e) {
407+
// Word, Punctuation, or Sentence
408+
var str = `WordBoundary event: \
409+
\r\n\tBoundaryType: ${e.boundaryType} \
410+
\r\n\tAudioOffset: ${(e.audioOffset + 5000) / 10000}ms \
411+
\r\n\tDuration: ${e.duration} \
412+
\r\n\tText: \"${e.text}\" \
413+
\r\n\tTextOffset: ${e.textOffset} \
414+
\r\n\tWordLength: ${e.wordLength}`;
415+
console.log(str);
416+
};
417+
418+
// Synthesize the SSML
419+
console.log(`SSML to synthesize: \r\n ${ssml}`)
420+
console.log(`Synthesize to: ${audioFile}`);
421+
speechSynthesizer.speakSsmlAsync(ssml,
422+
function (result) {
423+
if (result.reason === sdk.ResultReason.SynthesizingAudioCompleted) {
424+
console.log("SynthesizingAudioCompleted result");
425+
} else {
426+
console.error("Speech synthesis canceled, " + result.errorDetails +
427+
"\nDid you set the speech resource key and region values?");
428+
}
429+
speechSynthesizer.close();
430+
speechSynthesizer = null;
431+
},
432+
function (err) {
433+
console.trace("err - " + err);
434+
speechSynthesizer.close();
435+
speechSynthesizer = null;
436+
});
437+
}());
350438
```
351439

352440
You can find more text-to-speech samples at [GitHub](https://aka.ms/csspeech/samples).

0 commit comments

Comments
 (0)