docs(texttospeech): Create sample for Synthesize speech multiple speakers

holtskinner · holtskinner · commit f65f91c748c6 · 2024-11-19T06:48:42.000-06:00
- https://cloud.google.com/text-to-speech/docs/create-dialogue-with-multispeakers
diff --git a/texttospeech/snippets/requirements.txt b/texttospeech/snippets/requirements.txt
@@ -1,3 +1,3 @@
 future==1.0.0
-google-cloud-texttospeech==2.17.2
-google-cloud-storage==2.9.0
+google-cloud-texttospeech==2.21.1
+google-cloud-storage==2.18.2
diff --git a/texttospeech/snippets/synthesize_speech_multiple_speakers.py b/texttospeech/snippets/synthesize_speech_multiple_speakers.py
@@ -0,0 +1,84 @@
+#!/usr/bin/env python
+# Copyright 2014 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+"""Google Cloud Text-To-Speech API sample application .
+
+Example usage:
+    python synthesize_speech_multiple_speakers.py
+"""
+
+
+def synthesize_speech_multiple_speakers():
+    # [START tts_synthesize_speech_multiple_speakers]
+    """Synthesizes speech for multiple speakers.
+    Make sure to be working in a virtual environment.
+    """
+    from google.cloud import texttospeech_v1beta1 as texttospeech
+
+    # Instantiates a client
+    client = texttospeech.TextToSpeechClient()
+
+    multi_speaker_markup = texttospeech.MultiSpeakerMarkup(
+        turns=[
+            texttospeech.MultiSpeakerMarkup.Turn(
+                text="I've heard that the Google Cloud multi-speaker audio generation sounds amazing!",
+                speaker="R",
+            ),
+            texttospeech.MultiSpeakerMarkup.Turn(
+                text="Oh? What's so good about it?", speaker="S"
+            ),
+            texttospeech.MultiSpeakerMarkup.Turn(text="Well..", speaker="R"),
+            texttospeech.MultiSpeakerMarkup.Turn(text="Well what?", speaker="S"),
+            texttospeech.MultiSpeakerMarkup.Turn(
+                text="Well, you should find it out by yourself!", speaker="R"
+            ),
+            texttospeech.MultiSpeakerMarkup.Turn(
+                text="Alright alright, let's try it out!", speaker="S"
+            ),
+        ]
+    )
+
+    # Set the text input to be synthesized
+    synthesis_input = texttospeech.SynthesisInput(
+        multi_speaker_markup=multi_speaker_markup
+    )
+
+    # Build the voice request, select the language code ('en-US') and the voice
+    voice = texttospeech.VoiceSelectionParams(
+        language_code="en-US", name="en-US-Studio-MultiSpeaker"
+    )
+
+    # Select the type of audio file you want returned
+    audio_config = texttospeech.AudioConfig(
+        audio_encoding=texttospeech.AudioEncoding.MP3
+    )
+
+    # Perform the text-to-speech request on the text input with the selected
+    # voice parameters and audio file type
+    response = client.synthesize_speech(
+        input=synthesis_input, voice=voice, audio_config=audio_config
+    )
+
+    # The response's audio_content is binary.
+    with open("output.mp3", "wb") as out:
+        # Write the response to the output file.
+        out.write(response.audio_content)
+        print('Audio content written to file "output.mp3"')
+    # [END tts_synthesize_speech_multiple_speakers]
+
+
+if __name__ == "__main__":
+    synthesize_speech_multiple_speakers()
diff --git a/texttospeech/snippets/synthesize_speech_multiple_speakers_test.py b/texttospeech/snippets/synthesize_speech_multiple_speakers_test.py
@@ -0,0 +1,28 @@
+#!/usr/bin/env python
+# Copyright 2018 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import os
+
+import synthesize_speech_multiple_speakers
+
+
+def synthesize_speech_multiple_speakers_text(capsys):
+    synthesize_speech_multiple_speakers.synthesize_speech_multiple_speakers()
+    out, err = capsys.readouterr()
+
+    assert "Audio content written to file" in out
+    statinfo = os.stat("output.mp3")
+    assert statinfo.st_size > 0