Skip to content

Commit dded13b

Browse files
committed
feat(api): add Gemini Flash 2.0 Multimodal Live API support
1 parent 0870255 commit dded13b

File tree

1 file changed

+79
-0
lines changed

1 file changed

+79
-0
lines changed

fern/apis/api/openapi.json

Lines changed: 79 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -5543,6 +5543,75 @@
5543 5543
"model"
5544 5544
]
5545 5545
},
5546+
"GeminiMultimodalLivePrebuiltVoiceConfig": {
5547+
"type": "object",
5548+
"properties": {
5549+
"voiceName": {
5550+
"type": "string",
5551+
"enum": [
5552+
"Puck",
5553+
"Charon",
5554+
"Kore",
5555+
"Fenrir",
5556+
"Aoede"
5557+
]
5558+
}
5559+
},
5560+
"required": [
5561+
"voiceName"
5562+
]
5563+
},
5564+
"GeminiMultimodalLiveVoiceConfig": {
5565+
"type": "object",
5566+
"properties": {
5567+
"prebuiltVoiceConfig": {
5568+
"$ref": "#/components/schemas/GeminiMultimodalLivePrebuiltVoiceConfig"
5569+
}
5570+
},
5571+
"required": [
5572+
"prebuiltVoiceConfig"
5573+
]
5574+
},
5575+
"GeminiMultimodalLiveSpeechConfig": {
5576+
"type": "object",
5577+
"properties": {
5578+
"voiceConfig": {
5579+
"$ref": "#/components/schemas/GeminiMultimodalLiveVoiceConfig"
5580+
}
5581+
},
5582+
"required": [
5583+
"voiceConfig"
5584+
]
5585+
},
5586+
"GoogleRealtimeConfig": {
5587+
"type": "object",
5588+
"properties": {
5589+
"topP": {
5590+
"type": "number",
5591+
"description": "This is the nucleus sampling parameter that controls the cumulative probability of tokens considered during text generation.\nOnly applicable with the Gemini Flash 2.0 Multimodal Live API."
5592+
},
5593+
"topK": {
5594+
"type": "number",
5595+
"description": "This is the top-k sampling parameter that limits the number of highest probability tokens considered during text generation.\nOnly applicable with the Gemini Flash 2.0 Multimodal Live API."
5596+
},
5597+
"presencePenalty": {
5598+
"type": "number",
5599+
"description": "This is the presence penalty parameter that influences the model's likelihood to repeat information by penalizing tokens based on their presence in the text.\nOnly applicable with the Gemini Flash 2.0 Multimodal Live API."
5600+
},
5601+
"frequencyPenalty": {
5602+
"type": "number",
5603+
"description": "This is the frequency penalty parameter that influences the model's likelihood to repeat tokens by penalizing them based on their frequency in the text.\nOnly applicable with the Gemini Flash 2.0 Multimodal Live API."
5604+
},
5605+
"speechConfig": {
5606+
"description": "This is the speech configuration object that defines the voice settings to be used for the model's speech output.\nOnly applicable with the Gemini Flash 2.0 Multimodal Live API.",
5607+
"allOf": [
5608+
{
5609+
"$ref": "#/components/schemas/GeminiMultimodalLiveSpeechConfig"
5610+
}
5611+
]
5612+
}
5613+
}
5614+
},
5546 5615
"GoogleModel": {
5547 5616
"type": "object",
5548 5617
"properties": {
@@ -5613,6 +5682,8 @@
5613 5682
"type": "string",
5614 5683
"description": "This is the Google model that will be used.",
5615 5684
"enum": [
5685+
"gemini-2.0-flash-exp",
5686+
"gemini-2.0-flash-realtime-exp",
5616 5687
"gemini-1.5-flash",
5617 5688
"gemini-1.5-flash-002",
5618 5689
"gemini-1.5-pro",
@@ -5626,6 +5697,14 @@
5626 5697
"google"
5627 5698
]
5628 5699
},
5700+
"realtimeConfig": {
5701+
"description": "This is the session configuration for the Gemini Flash 2.0 Multimodal Live API.\nOnly applicable if the model `gemini-2.0-flash-realtime-exp` is selected.",
5702+
"allOf": [
5703+
{
5704+
"$ref": "#/components/schemas/GoogleRealtimeConfig"
5705+
}
5706+
]
5707+
},
5629 5708
"temperature": {
5630 5709
"type": "number",
5631 5710
"description": "This is the temperature that will be used for calls. Default is 0 to leverage caching for lower latency.",

0 commit comments

Comments
 (0)