docs(texttospeech): Update TTS Samples to use Chirp 3 Model (#13253)

holtskinner · web-flow · commit 6194578038fe · 2025-03-25T11:21:36.000-05:00
diff --git a/texttospeech/snippets/streaming_tts_quickstart.py b/texttospeech/snippets/streaming_tts_quickstart.py
@@ -23,27 +23,41 @@
 
 def run_streaming_tts_quickstart():
     # [START tts_synthezise_streaming]
-    """Synthesizes speech from a stream of input text.
-    """
+    """Synthesizes speech from a stream of input text."""
     from google.cloud import texttospeech
-    import itertools
 
     client = texttospeech.TextToSpeechClient()
 
     # See https://cloud.google.com/text-to-speech/docs/voices for all voices.
-    streaming_config = texttospeech.StreamingSynthesizeConfig(voice=texttospeech.VoiceSelectionParams(name="en-US-Journey-D", language_code="en-US"))
+    streaming_config = texttospeech.StreamingSynthesizeConfig(
+        voice=texttospeech.VoiceSelectionParams(
+            name="en-US-Chirp3-HD-Charon",
+            language_code="en-US",
+        )
+    )
 
     # Set the config for your stream. The first request must contain your config, and then each subsequent request must contain text.
-    config_request = texttospeech.StreamingSynthesizeRequest(streaming_config=streaming_config)
+    config_request = texttospeech.StreamingSynthesizeRequest(
+        streaming_config=streaming_config
+    )
+
+    text_iterator = [
+        "Hello there. ",
+        "How are you ",
+        "today? It's ",
+        "such nice weather outside.",
+    ]
 
     # Request generator. Consider using Gemini or another LLM with output streaming as a generator.
     def request_generator():
-        yield texttospeech.StreamingSynthesizeRequest(input=texttospeech.StreamingSynthesisInput(text="Hello there. "))
-        yield texttospeech.StreamingSynthesizeRequest(input=texttospeech.StreamingSynthesisInput(text="How are you "))
-        yield texttospeech.StreamingSynthesizeRequest(input=texttospeech.StreamingSynthesisInput(text="today? It's "))
-        yield texttospeech.StreamingSynthesizeRequest(input=texttospeech.StreamingSynthesisInput(text="such nice weather outside."))
+        yield config_request
+        for text in text_iterator:
+            yield texttospeech.StreamingSynthesizeRequest(
+                input=texttospeech.StreamingSynthesisInput(text=text)
+            )
+
+    streaming_responses = client.streaming_synthesize(request_generator())
 
-    streaming_responses = client.streaming_synthesize(itertools.chain([config_request], request_generator()))
     for response in streaming_responses:
         print(f"Audio content size in bytes is: {len(response.audio_content)}")
     # [END tts_synthezise_streaming]
diff --git a/texttospeech/snippets/synthesize_text.py b/texttospeech/snippets/synthesize_text.py
@@ -38,16 +38,17 @@ def synthesize_text():
     # Names of voices can be retrieved with client.list_voices().
     voice = texttospeech.VoiceSelectionParams(
         language_code="en-US",
-        name="en-US-Standard-C",
-        ssml_gender=texttospeech.SsmlVoiceGender.FEMALE,
+        name="en-US-Chirp3-HD-Charon",
     )
 
     audio_config = texttospeech.AudioConfig(
         audio_encoding=texttospeech.AudioEncoding.MP3
     )
 
     response = client.synthesize_speech(
-        request={"input": input_text, "voice": voice, "audio_config": audio_config}
+        input=input_text,
+        voice=voice,
+        audio_config=audio_config,
     )
 
     # The response's audio_content is binary.

Original file line number	Diff line number	Diff line change
`@@ -38,16 +38,17 @@ def synthesize_text():`
`38`	`38`	`# Names of voices can be retrieved with client.list_voices().`
`39`	`39`	`voice = texttospeech.VoiceSelectionParams(`
`40`	`40`	`language_code="en-US",`
`41`		`- name="en-US-Standard-C",`
`42`		`- ssml_gender=texttospeech.SsmlVoiceGender.FEMALE,`
	`41`	`+ name="en-US-Chirp3-HD-Charon",`
`43`	`42`	`)`
`44`	`43`
`45`	`44`	`audio_config = texttospeech.AudioConfig(`
`46`	`45`	`audio_encoding=texttospeech.AudioEncoding.MP3`
`47`	`46`	`)`
`48`	`47`
`49`	`48`	`response = client.synthesize_speech(`
`50`		`- request={"input": input_text, "voice": voice, "audio_config": audio_config}`
	`49`	`+ input=input_text,`
	`50`	`+ voice=voice,`
	`51`	`+ audio_config=audio_config,`
`51`	`52`	`)`
`52`	`53`
`53`	`54`	`# The response's audio_content is binary.`