Skip to content

Commit b5987d6

Browse files
committed
python synthesizer events
1 parent 2291f62 commit b5987d6

File tree

1 file changed

+77
-3
lines changed
  • articles/cognitive-services/Speech-Service/includes/how-to/speech-synthesis

1 file changed

+77
-3
lines changed

articles/cognitive-services/Speech-Service/includes/how-to/speech-synthesis/python.md

Lines changed: 77 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -157,11 +157,85 @@ While using the [SpeechSynthesizer](/python/api/azure-cognitiveservices-speech/a
157157

158158
[!INCLUDE [Event types](events.md)]
159159

160-
Here's an example that shows how to subscribe to the `BookmarkReached` event for speech synthesis.
160+
Here's an example that shows how to subscribe to events for speech synthesis. You can follow the instructions in the [quickstart](../../../get-started-text-to-speech.md?pivots=python), but replace the contents of that `speech-synthesis.py` file with the following Python code.
161161

162162
```python
163-
speech_synthesizer.bookmark_reached.connect(lambda evt: print(
164-
"Bookmark reached: {}, audio offset: {}ms, bookmark text: {}.".format(evt, evt.audio_offset / 10000, evt.text)))
163+
import os
import azure.cognitiveservices.speech as speechsdk


def speech_synthesizer_bookmark_reached_cb(evt: speechsdk.SessionEventArgs):
    """Fires when a <bookmark/> element in the SSML is reached during synthesis."""
    print('BookmarkReached event')
    # audio_offset is in 100-nanosecond ticks; +5000 rounds to the nearest millisecond.
    print('\tAudioOffset: {}ms'.format((evt.audio_offset + 5000) / 10000))
    print('\tText: {}'.format(evt.text))


def speech_synthesizer_synthesis_canceled_cb(evt: speechsdk.SessionEventArgs):
    """Fires when synthesis is canceled (for example, on an error)."""
    print('SynthesisCanceled event')


def speech_synthesizer_synthesis_completed_cb(evt: speechsdk.SessionEventArgs):
    """Fires once when synthesis has finished and all audio is available."""
    print('SynthesisCompleted event')
    print('\tAudioData: {} bytes'.format(len(evt.result.audio_data)))
    print('\tAudioDuration: {}'.format(evt.result.audio_duration))


def speech_synthesizer_synthesis_started_cb(evt: speechsdk.SessionEventArgs):
    """Fires once when synthesis begins."""
    print('SynthesisStarted event')


def speech_synthesizer_word_boundary_cb(evt: speechsdk.SessionEventArgs):
    """Fires at each word (or sentence/punctuation) boundary in the synthesized speech."""
    print('WordBoundary event')
    print('\tBoundaryType: {}'.format(evt.boundary_type))
    # audio_offset is in 100-nanosecond ticks; +5000 rounds to the nearest millisecond.
    print('\tAudioOffset: {}ms'.format((evt.audio_offset + 5000) / 10000))
    print('\tDuration: {}'.format(evt.duration))
    print('\tText: {}'.format(evt.text))
    print('\tTextOffset: {}'.format(evt.text_offset))
    print('\tWordLength: {}'.format(evt.word_length))


def speech_synthesizer_synthesizing_cb(evt: speechsdk.SessionEventArgs):
    """Fires repeatedly as chunks of synthesized audio become available."""
    print('Synthesizing event')
    print('\tAudioData: {} bytes'.format(len(evt.result.audio_data)))


def speech_synthesizer_viseme_received_cb(evt: speechsdk.SessionEventArgs):
    """Fires for each viseme (visual phoneme) produced during synthesis."""
    print('VisemeReceived event')
    # audio_offset is in 100-nanosecond ticks; +5000 rounds to the nearest millisecond.
    print('\tAudioOffset: {}ms'.format((evt.audio_offset + 5000) / 10000))
    print('\tVisemeId: {}'.format(evt.viseme_id))


speech_config = speechsdk.SpeechConfig(subscription=os.environ.get('SPEECH_KEY'), region=os.environ.get('SPEECH_REGION'))

# Required for WordBoundary events at sentence boundaries.
# Set this on the config BEFORE creating the synthesizer — the original sample
# set it after construction, where it has no effect on the already-built synthesizer.
speech_config.set_property(property_id=speechsdk.PropertyId.SpeechServiceResponse_RequestSentenceBoundary, value='true')

audio_config = speechsdk.audio.AudioOutputConfig(use_default_speaker=True)
speech_synthesizer = speechsdk.SpeechSynthesizer(speech_config=speech_config, audio_config=audio_config)

# Subscribe to events
speech_synthesizer.bookmark_reached.connect(speech_synthesizer_bookmark_reached_cb)
speech_synthesizer.synthesis_canceled.connect(speech_synthesizer_synthesis_canceled_cb)
speech_synthesizer.synthesis_completed.connect(speech_synthesizer_synthesis_completed_cb)
speech_synthesizer.synthesis_started.connect(speech_synthesizer_synthesis_started_cb)
speech_synthesizer.synthesis_word_boundary.connect(speech_synthesizer_word_boundary_cb)
speech_synthesizer.synthesizing.connect(speech_synthesizer_synthesizing_cb)
speech_synthesizer.viseme_received.connect(speech_synthesizer_viseme_received_cb)

# The language of the voice that speaks.
speech_synthesis_voice_name = 'en-US-JennyNeural'

# SSML containing a viseme request and two bookmarks that trigger BookmarkReached events.
ssml = """<speak version='1.0' xml:lang='en-US' xmlns='http://www.w3.org/2001/10/synthesis' xmlns:mstts='http://www.w3.org/2001/mstts'>
    <voice name='{}'>
        <mstts:viseme type='redlips_front'/>
        The rainbow has seven colors: <bookmark mark='colors_list_begin'/>Red, orange, yellow, green, blue, indigo, and violet.<bookmark mark='colors_list_end'/>.
    </voice>
</speak>""".format(speech_synthesis_voice_name)

# Synthesize the SSML
print("SSML to synthesize: \r\n{}".format(ssml))
speech_synthesis_result = speech_synthesizer.speak_ssml_async(ssml).get()

if speech_synthesis_result.reason == speechsdk.ResultReason.SynthesizingAudioCompleted:
    print("SynthesizingAudioCompleted result")
elif speech_synthesis_result.reason == speechsdk.ResultReason.Canceled:
    cancellation_details = speech_synthesis_result.cancellation_details
    print("Speech synthesis canceled: {}".format(cancellation_details.reason))
    if cancellation_details.reason == speechsdk.CancellationReason.Error:
        if cancellation_details.error_details:
            print("Error details: {}".format(cancellation_details.error_details))
            print("Did you set the speech resource key and region values?")
165239
```
166240

167241
You can find more text-to-speech samples at [GitHub](https://aka.ms/csspeech/samples).

0 commit comments

Comments
 (0)