Commit cb27bf9

change modelid in conversationstate into model info

1 parent 33c2537 · commit cb27bf9

File tree

6 files changed: +196 −68 lines changed


crates/chat-cli/src/cli/chat/cli/context.rs

Lines changed: 1 addition & 2 deletions

@@ -222,8 +222,7 @@ impl ContextSubcommand {
            execute!(session.stderr, style::Print(format!("{}\n\n", "▔".repeat(3))),)?;
        }

-        let context_files_max_size =
-            calc_max_context_files_size(session.conversation.model.as_deref(), os).await;
+        let context_files_max_size = calc_max_context_files_size(session.conversation.model.as_ref());
        let mut files_as_vec = profile_context_files
            .iter()
            .map(|(path, content, _)| (path.clone(), content.clone()))

crates/chat-cli/src/cli/chat/cli/model.rs

Lines changed: 138 additions & 34 deletions

@@ -9,6 +9,11 @@ use crossterm::{
     queue,
 };
 use dialoguer::Select;
+use serde::{
+    Deserialize,
+    Deserializer,
+    Serialize,
+};

 use crate::api_client::Endpoint;
 use crate::cli::chat::{
@@ -17,6 +22,110 @@ use crate::cli::chat::{
     ChatState,
 };
 use crate::os::Os;
+
+#[derive(Debug, Clone, Serialize)]
+pub struct ModelInfo {
+    /// Display name
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub model_name: Option<String>,
+    /// Actual model id to send in the API
+    pub model_id: String,
+    /// Size of the model's context window, in tokens
+    #[serde(default = "default_context_window")]
+    pub context_window_tokens: usize,
+}
+
+impl ModelInfo {
+    pub fn from_api_model(model: &Model) -> Self {
+        let context_window_tokens = model
+            .token_limits()
+            .and_then(|limits| limits.max_input_tokens())
+            .map_or(default_context_window(), |tokens| tokens as usize);
+        Self {
+            model_id: model.model_id().to_string(),
+            model_name: model.model_name().map(|s| s.to_string()),
+            context_window_tokens,
+        }
+    }
+
+    /// Create a default model with only a model_id (compatible with old stored model data)
+    pub fn from_id(model_id: String) -> Self {
+        Self {
+            model_id,
+            model_name: None,
+            context_window_tokens: 200_000,
+        }
+    }
+
+    pub fn display_name(&self) -> &str {
+        self.model_name.as_deref().unwrap_or(&self.model_id)
+    }
+}
+impl<'de> Deserialize<'de> for ModelInfo {
+    fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
+    where
+        D: Deserializer<'de>,
+    {
+        use std::fmt;
+
+        use serde::de::{
+            self,
+            MapAccess,
+            Visitor,
+        };
+
+        struct ModelInfoVisitor;
+
+        impl<'de> Visitor<'de> for ModelInfoVisitor {
+            type Value = ModelInfo;
+
+            fn expecting(&self, formatter: &mut fmt::Formatter<'_>) -> fmt::Result {
+                formatter.write_str("a string or a ModelInfo object")
+            }
+
+            // Old format: a bare model_id string
+            fn visit_str<E>(self, value: &str) -> Result<ModelInfo, E>
+            where
+                E: de::Error,
+            {
+                Ok(ModelInfo {
+                    model_id: value.to_string(),
+                    model_name: None,
+                    context_window_tokens: default_context_window(),
+                })
+            }
+
+            // New format: a full ModelInfo object
+            fn visit_map<M>(self, mut map: M) -> Result<ModelInfo, M::Error>
+            where
+                M: MapAccess<'de>,
+            {
+                let mut model_id = None;
+                let mut model_name = None;
+                let mut context_window_tokens = None;
+
+                while let Some(key) = map.next_key::<String>()? {
+                    match key.as_str() {
+                        "model_id" => model_id = Some(map.next_value()?),
+                        "model_name" => model_name = map.next_value()?,
+                        "context_window_tokens" => context_window_tokens = Some(map.next_value()?),
+                        _ => {
+                            let _: serde::de::IgnoredAny = map.next_value()?;
+                        },
+                    }
+                }
+
+                Ok(ModelInfo {
+                    model_id: model_id.ok_or_else(|| de::Error::missing_field("model_id"))?,
+                    model_name,
+                    context_window_tokens: context_window_tokens.unwrap_or_else(default_context_window),
+                })
+            }
+        }
+
+        deserializer.deserialize_any(ModelInfoVisitor)
+    }
+}
 #[deny(missing_docs)]
 #[derive(Debug, PartialEq, Args)]
 pub struct ModelArgs;
@@ -45,14 +154,13 @@ pub async fn select_model(os: &Os, session: &mut ChatSession) -> Result<Option<C
         return Ok(None);
     }

-    let active_model_id = session.conversation.model.as_deref();
+    let active_model_id = session.conversation.model.as_ref().map(|m| m.model_id.as_str());

     let labels: Vec<String> = models
         .iter()
         .map(|model| {
-            let display_name = model.model_name().unwrap_or(model.model_id());
-
-            if Some(model.model_id()) == active_model_id {
+            let display_name = model.display_name();
+            if Some(model.model_id.as_str()) == active_model_id {
                 format!("{} (active)", display_name)
             } else {
                 display_name.to_owned()
@@ -81,10 +189,9 @@ pub async fn select_model(os: &Os, session: &mut ChatSession) -> Result<Option<C
     queue!(session.stderr, style::ResetColor)?;

     if let Some(index) = selection {
-        let selected = &models[index];
-        let model_id_str = selected.model_id.clone();
-        session.conversation.model = Some(model_id_str.clone());
-        let display_name = selected.model_name().unwrap_or(selected.model_id());
+        let selected = models[index].clone();
+        session.conversation.model = Some(selected.clone());
+        let display_name = selected.display_name();

         queue!(
             session.stderr,
@@ -103,41 +210,38 @@ pub async fn select_model(os: &Os, session: &mut ChatSession) -> Result<Option<C
     }))
 }

+pub async fn get_model_info(model_id: &str, os: &Os) -> Result<ModelInfo, ChatError> {
+    let (models, _) = get_available_models(os).await?;
+
+    models
+        .into_iter()
+        .find(|m| m.model_id == model_id)
+        .ok_or_else(|| ChatError::Custom(format!("Model '{}' not found", model_id).into()))
+}
+
 /// Get available models with caching support
-pub async fn get_available_models(os: &Os) -> Result<(Vec<Model>, Model), ChatError> {
+pub async fn get_available_models(os: &Os) -> Result<(Vec<ModelInfo>, ModelInfo), ChatError> {
     let endpoint = Endpoint::configured_value(&os.database);
     let region = endpoint.region().as_ref();

-    os.client
+    let (api_models, api_default) = os
+        .client
         .get_available_models(region)
         .await
-        .map_err(|e| ChatError::Custom(format!("Failed to fetch available models: {}", e).into()))
+        .map_err(|e| ChatError::Custom(format!("Failed to fetch available models: {}", e).into()))?;
+
+    let models: Vec<ModelInfo> = api_models.iter().map(ModelInfo::from_api_model).collect();
+    let default_model = ModelInfo::from_api_model(&api_default);
+
+    Ok((models, default_model))
 }

 /// Returns the context window length in tokens for the given model_id.
 /// Uses cached model data when available
-pub async fn context_window_tokens(model_id: Option<&str>, os: &Os) -> usize {
-    const DEFAULT_CONTEXT_WINDOW_LENGTH: usize = 200_000;
-
-    // If no model_id provided, return default
-    let Some(model_id) = model_id else {
-        return DEFAULT_CONTEXT_WINDOW_LENGTH;
-    };
-
-    // Try to get from cached models first
-    let (models, _) = match get_available_models(os).await {
-        Ok(models) => models,
-        Err(_) => {
-            // If we can't get models, return default
-            return DEFAULT_CONTEXT_WINDOW_LENGTH;
-        },
-    };
+pub fn context_window_tokens(model_info: Option<&ModelInfo>) -> usize {
+    model_info.map(|m| m.context_window_tokens).unwrap_or(200_000)
+}

-    models
-        .iter()
-        .find(|m| m.model_id() == model_id)
-        .and_then(|m| m.token_limits())
-        .and_then(|limits| limits.max_input_tokens())
-        .map(|tokens| tokens as usize)
-        .unwrap_or(DEFAULT_CONTEXT_WINDOW_LENGTH)
+fn default_context_window() -> usize {
+    200_000
 }
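
The hand-written Deserialize impl above is what keeps previously stored conversation state loadable: a bare model-id string (the old format) and a full object (the new format) both deserialize into ModelInfo. A minimal sketch of that behavior, assuming ModelInfo and its impls are in scope and serde_json is available as a dev-dependency; the test name and values are illustrative, not part of the commit:

#[cfg(test)]
mod model_info_compat_sketch {
    use super::*;

    #[test]
    fn accepts_both_stored_formats() {
        // Old format: conversation state stored the model as a bare id string.
        let legacy: ModelInfo = serde_json::from_str(r#""CLAUDE_SONNET_4_20250514_V1_0""#).unwrap();
        assert_eq!(legacy.model_id, "CLAUDE_SONNET_4_20250514_V1_0");
        // visit_str falls back to default_context_window() for the window size.
        assert_eq!(legacy.context_window_tokens, 200_000);

        // New format: the model is stored as a full ModelInfo object.
        let json = r#"{"model_id":"OPENAI_GPT_OSS_120B_1_0","model_name":"GPT","context_window_tokens":128000}"#;
        let new: ModelInfo = serde_json::from_str(json).unwrap();
        assert_eq!(new.display_name(), "GPT");
        assert_eq!(new.context_window_tokens, 128_000);
    }
}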

crates/chat-cli/src/cli/chat/cli/usage.rs

Lines changed: 1 addition & 1 deletion

@@ -62,7 +62,7 @@ impl UsageArgs {
        // set a max width for the progress bar for better aesthetic
        let progress_bar_width = std::cmp::min(window_width, 80);

-        let context_window_size = context_window_tokens(session.conversation.model.as_deref(), os).await;
+        let context_window_size = context_window_tokens(session.conversation.model.as_ref());
        let context_width =
            ((context_token_count.value() as f64 / context_window_size as f64) * progress_bar_width as f64) as usize;
        let assistant_width =
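
For a sense of the bar arithmetic: with 50_000 context tokens in a 200_000-token window and an 80-column bar, context_width comes out to (50_000 / 200_000) × 80 = 20 columns.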

crates/chat-cli/src/cli/chat/context.rs

Lines changed: 17 additions & 7 deletions

@@ -23,6 +23,7 @@ use crate::cli::agent::hook::{
 };
 use crate::cli::chat::ChatError;
 use crate::cli::chat::cli::hooks::HookExecutor;
+use crate::cli::chat::cli::model::ModelInfo;
 use crate::os::Os;

 #[derive(Debug, Clone)]
@@ -255,9 +256,9 @@ impl ContextManager {
 }

 /// Calculates the maximum context files size to use for the given model id.
-pub async fn calc_max_context_files_size(model_id: Option<&str>, os: &Os) -> usize {
+pub fn calc_max_context_files_size(model: Option<&ModelInfo>) -> usize {
     // Sets the max as 75% of the context window
-    context_window_tokens(model_id, os).await.saturating_mul(3) / 4
+    context_window_tokens(model).saturating_mul(3) / 4
 }

 /// Process a path, handling glob patterns and file types.
@@ -432,13 +433,22 @@ mod tests {
     }

     #[test]
-    async fn test_calc_max_context_files_size() {
-        let os = Os::new().await.unwrap();
-
+    fn test_calc_max_context_files_size() {
         assert_eq!(
-            calc_max_context_files_size(Some("CLAUDE_SONNET_4_20250514_V1_0"), os),
+            calc_max_context_files_size(Some(&ModelInfo {
+                model_id: "CLAUDE_SONNET_4_20250514_V1_0".to_string(),
+                model_name: Some("Claude".to_string()),
+                context_window_tokens: 200_000,
+            })),
             150_000
         );
-        assert_eq!(calc_max_context_files_size(Some("OPENAI_GPT_OSS_120B_1_0"), os), 96_000);
+        assert_eq!(
+            calc_max_context_files_size(Some(&ModelInfo {
+                model_id: "OPENAI_GPT_OSS_120B_1_0".to_string(),
+                model_name: Some("GPT".to_string()),
+                context_window_tokens: 128_000,
+            })),
+            96_000
+        );
     }
 }
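
The updated test expectations follow directly from the 75% rule in calc_max_context_files_size: 200_000 × 3 / 4 = 150_000 and 128_000 × 3 / 4 = 96_000.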
