|
| 1 | +/* |
| 2 | + * Copyright 2023 Google LLC |
| 3 | + * |
| 4 | + * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | + * you may not use this file except in compliance with the License. |
| 6 | + * You may obtain a copy of the License at |
| 7 | + * |
| 8 | + * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | + * |
| 10 | + * Unless required by applicable law or agreed to in writing, software |
| 11 | + * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | + * See the License for the specific language governing permissions and |
| 14 | + * limitations under the License. |
| 15 | + */ |
| 16 | + |
| 17 | +package com.google.firebase.vertexai.type |
| 18 | + |
| 19 | +import kotlinx.serialization.SerialName |
| 20 | +import kotlinx.serialization.Serializable |
| 21 | + |
/**
 * Configuration parameters to use for live content generation.
 *
 * @property temperature A parameter controlling the degree of randomness in token selection. A
 * temperature of 0 means that the highest probability tokens are always selected. In this case,
 * responses for a given prompt are mostly deterministic, but a small amount of variation is still
 * possible.
 *
 * @property topK The `topK` parameter changes how the model selects tokens for output. A `topK` of
 * 1 means the selected token is the most probable among all the tokens in the model's vocabulary,
 * while a `topK` of 3 means that the next token is selected from among the 3 most probable using
 * the `temperature`. For each token selection step, the `topK` tokens with the highest
 * probabilities are sampled. Tokens are then further filtered based on `topP` with the final token
 * selected using `temperature` sampling. Defaults to 40 if unspecified.
 *
 * @property topP The `topP` parameter changes how the model selects tokens for output. Tokens are
 * selected from the most to least probable until the sum of their probabilities equals the `topP`
 * value. For example, if tokens A, B, and C have probabilities of 0.3, 0.2, and 0.1 respectively
 * and the topP value is 0.5, then the model will select either A or B as the next token by using
 * the `temperature` and exclude C as a candidate. Defaults to 0.95 if unset.
 *
 * @property candidateCount The maximum number of generated response messages to return. This value
 * must be between [1, 8], inclusive. If unset, this will default to 1.
 *
 * - Note: Only unique candidates are returned. Higher temperatures are more likely to produce
 * unique candidates. Setting `temperature` to 0 will always produce exactly one candidate
 * regardless of the `candidateCount`.
 *
 * @property presencePenalty Positive penalties.
 *
 * @property frequencyPenalty Frequency penalties.
 *
 * @property maxOutputTokens Specifies the maximum number of tokens that can be generated in the
 * response. The number of tokens per word varies depending on the language outputted. Defaults to 0
 * (unbounded).
 *
 * @property responseModalities The list of modalities (e.g. text, audio) that the model should
 * respond with. NOTE(review): semantics presumed from the type name — confirm against backend docs.
 *
 * @property speechConfig Configuration for speech synthesis in the model's responses.
 * NOTE(review): semantics presumed from the type name — confirm against backend docs.
 */
public class LiveGenerationConfig
private constructor(
  internal val temperature: Float?,
  internal val topK: Int?,
  internal val topP: Float?,
  internal val candidateCount: Int?,
  internal val maxOutputTokens: Int?,
  internal val presencePenalty: Float?,
  internal val frequencyPenalty: Float?,
  // FIX: the original was missing the comma separating these two parameters (syntax error).
  internal val responseModalities: List<ContentModality>?,
  internal val speechConfig: SpeechConfig?
) {

  /**
   * Builder for creating a [LiveGenerationConfig].
   *
   * Mainly intended for Java interop. Kotlin consumers should use [liveGenerationConfig] for a
   * more idiomatic experience.
   *
   * @property temperature See [LiveGenerationConfig.temperature].
   *
   * @property topK See [LiveGenerationConfig.topK].
   *
   * @property topP See [LiveGenerationConfig.topP].
   *
   * @property candidateCount See [LiveGenerationConfig.candidateCount].
   *
   * @property maxOutputTokens See [LiveGenerationConfig.maxOutputTokens].
   *
   * @property presencePenalty See [LiveGenerationConfig.presencePenalty]
   *
   * @property frequencyPenalty See [LiveGenerationConfig.frequencyPenalty]
   *
   * @property responseModalities See [LiveGenerationConfig.responseModalities].
   *
   * @property speechConfig See [LiveGenerationConfig.speechConfig].
   * @see [liveGenerationConfig]
   */
  public class Builder {
    @JvmField public var temperature: Float? = null
    @JvmField public var topK: Int? = null
    @JvmField public var topP: Float? = null
    @JvmField public var candidateCount: Int? = null
    @JvmField public var maxOutputTokens: Int? = null
    @JvmField public var presencePenalty: Float? = null
    @JvmField public var frequencyPenalty: Float? = null
    // FIX: was erroneously declared as List<SpeechConfig>?, which does not match the
    // constructor parameter's List<ContentModality>? type.
    @JvmField public var responseModalities: List<ContentModality>? = null
    @JvmField public var speechConfig: SpeechConfig? = null

    /** Create a new [LiveGenerationConfig] with the attached arguments. */
    public fun build(): LiveGenerationConfig =
      LiveGenerationConfig(
        temperature = temperature,
        topK = topK,
        topP = topP,
        candidateCount = candidateCount,
        maxOutputTokens = maxOutputTokens,
        presencePenalty = presencePenalty,
        frequencyPenalty = frequencyPenalty,
        responseModalities = responseModalities,
        speechConfig = speechConfig,
      )
  }

  /** Converts this public config into its wire-format representation for serialization. */
  internal fun toInternal() =
    Internal(
      temperature = temperature,
      topP = topP,
      topK = topK,
      candidateCount = candidateCount,
      maxOutputTokens = maxOutputTokens,
      frequencyPenalty = frequencyPenalty,
      presencePenalty = presencePenalty,
      speechConfig = speechConfig,
      responseModalities = responseModalities,
    )

  /** Wire-format (snake_case) representation of [LiveGenerationConfig]. */
  @Serializable
  internal data class Internal(
    val temperature: Float?,
    @SerialName("top_p") val topP: Float?,
    @SerialName("top_k") val topK: Int?,
    @SerialName("candidate_count") val candidateCount: Int?,
    @SerialName("max_output_tokens") val maxOutputTokens: Int?,
    @SerialName("presence_penalty") val presencePenalty: Float? = null,
    @SerialName("frequency_penalty") val frequencyPenalty: Float? = null,
    @SerialName("speech_config") val speechConfig: SpeechConfig? = null,
    @SerialName("response_modalities") val responseModalities: List<ContentModality>? = null,
  )

  public companion object {

    /**
     * Alternative casing for [LiveGenerationConfig.Builder]:
     * ```
     * val config = LiveGenerationConfig.builder()
     * ```
     */
    public fun builder(): Builder = Builder()
  }
}
| 182 | + |
/**
 * Helper method to construct a [LiveGenerationConfig] in a DSL-like manner.
 *
 * Example Usage:
 * ```
 * liveGenerationConfig {
 *   temperature = 0.75f
 *   topP = 0.5f
 *   topK = 30
 *   candidateCount = 4
 *   maxOutputTokens = 300
 * }
 * ```
 */
public fun liveGenerationConfig(
  init: LiveGenerationConfig.Builder.() -> Unit
): LiveGenerationConfig {
  val builder = LiveGenerationConfig.builder()
  builder.init()
  return builder.build()
}
0 commit comments