|
318 | 318 | } |
319 | 319 | } |
320 | 320 | }, |
321 | | - "revision": "20250415", |
| 321 | + "revision": "20250424", |
322 | 322 | "rootUrl": "https://texttospeech.googleapis.com/", |
323 | 323 | "schemas": { |
324 | 324 | "AdvancedVoiceOptions": { |
|
403 | 403 | "enum": [ |
404 | 404 | "PHONETIC_ENCODING_UNSPECIFIED", |
405 | 405 | "PHONETIC_ENCODING_IPA", |
406 | | - "PHONETIC_ENCODING_X_SAMPA" |
| 406 | + "PHONETIC_ENCODING_X_SAMPA", |
| 407 | + "PHONETIC_ENCODING_JAPANESE_YOMIGANA", |
| 408 | + "PHONETIC_ENCODING_PINYIN" |
407 | 409 | ], |
408 | 410 | "enumDescriptions": [ |
409 | 411 | "Not specified.", |
410 | 412 | "IPA, such as apple -> ˈæpəl. https://en.wikipedia.org/wiki/International_Phonetic_Alphabet", |
411 | | - "X-SAMPA, such as apple -> \"{p@l\". https://en.wikipedia.org/wiki/X-SAMPA" |
| 413 | + "X-SAMPA, such as apple -> \"{p@l\". https://en.wikipedia.org/wiki/X-SAMPA", |
| 414 | + "For reading-to-pronunciation conversion to work well, the `pronunciation` field should only contain Kanji, Hiragana, and Katakana. The pronunciation can also contain pitch accents. The start of a pitch phrase is specified with `^` and the down-pitch position is specified with `!`, for example: phrase:端 pronunciation:`^はし`; phrase:箸 pronunciation:`^は!し`; phrase:橋 pronunciation:`^はし!`. We currently only support the Tokyo dialect, which allows at most one down-pitch per phrase (i.e. at most one `!` following each `^`).", |
| 415 | + "Used to specify pronunciations for Mandarin words. See https://en.wikipedia.org/wiki/Pinyin. For example, the pronunciation of 朝阳 is \"chao2 yang2\". The number represents the tone, and there is a space between syllables. Neutral tones are represented by 5, for example 孩子 \"hai2 zi5\"." |
412 | 416 | ], |
413 | 417 | "type": "string" |
414 | 418 | }, |
|
608 | 612 | "$ref": "CustomPronunciations", |
609 | 613 | "description": "Optional. The pronunciation customizations are applied to the input. If this is set, the input is synthesized using the given pronunciation customizations. The initial support is for en-us, with plans to expand to other locales in the future. Instant Clone voices aren't supported. In order to customize the pronunciation of a phrase, there must be an exact match of the phrase in the input types. If using SSML, the phrase must not be inside a phoneme tag." |
610 | 614 | }, |
| 615 | + "markup": { |
| 616 | + "description": "Markup for HD voices specifically. This field may not be used with any other voices.", |
| 617 | + "type": "string" |
| 618 | + }, |
611 | 619 | "multiSpeakerMarkup": { |
612 | 620 | "$ref": "MultiSpeakerMarkup", |
613 | 621 | "description": "The multi-speaker input to be synthesized. Only applicable for multi-speaker synthesis." |
|
0 commit comments