
Commit e69292e

better model parsing added as subcrate

1 parent 1f2f15d commit e69292e

11 files changed: +191 -150 lines changed

.env.example

Lines changed: 1 addition & 1 deletion
```diff
@@ -10,7 +10,7 @@ DKN_ADMIN_PUBLIC_KEY=0208ef5e65a9c656a6f92fb2c770d5d5e2ecffe02a6aade19207f75110b
 DKN_MODELS=
 
 ## DRIA (optional) ##
-# P2P address, you don't need to change this unless you really want this port.
+# P2P address, you don't need to change this unless this port is already in use.
 DKN_P2P_LISTEN_ADDR=/ip4/0.0.0.0/tcp/4001
 # Comma-separated static relay nodes
 DKN_RELAY_NODES=
```
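For reference, `DKN_MODELS` above holds the comma-separated model list that the reworked `ModelConfig::new_from_csv` parses below; a hypothetical example value (model names illustrative, taken from the doc-comment removed in this commit):

```
DKN_MODELS=gpt-4-turbo,gpt-4o-mini
```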

Cargo.lock

Lines changed: 1 addition & 0 deletions
Some generated files are not rendered by default.

Cargo.toml

Lines changed: 1 addition & 1 deletion
```diff
@@ -17,7 +17,7 @@ serde = { version = "1.0", features = ["derive"] }
 serde_json = "1.0"
 async-trait = "0.1.81"
 reqwest = "0.12.5"
-
+rand = "0.8.5"
 env_logger = "0.11.3"
 log = "0.4.21"
 eyre = "0.6.12"
```

workflows/Cargo.toml

Lines changed: 2 additions & 1 deletion
```diff
@@ -15,8 +15,9 @@ serde.workspace = true
 serde_json.workspace = true
 async-trait.workspace = true
 reqwest.workspace = true
-
+rand.workspace = true
 log.workspace = true
 eyre.workspace = true
 
+# ollama-rs is re-exported from ollama-workflows
 ollama-workflows = { git = "https://github.com/andthattoo/ollama-workflows" }
```
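Here `rand.workspace = true` inherits the version pinned at the workspace root; a sketch of the assumed root `Cargo.toml` entry, matching the `rand = "0.8.5"` line added in the root manifest above (the section header is an assumption, as the diff only shows surrounding dependency lines):

```toml
# root Cargo.toml (assumed section)
[workspace.dependencies]
rand = "0.8.5"
```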

workflows/src/models.rs renamed to workflows/src/config.rs

Lines changed: 92 additions & 77 deletions
```diff
@@ -1,89 +1,21 @@
-use crate::{utils::split_comma_separated, OllamaConfig, OpenAIConfig};
+use crate::{split_comma_separated, OllamaConfig, OpenAIConfig};
 use eyre::{eyre, Result};
 use ollama_workflows::{Model, ModelProvider};
 use rand::seq::IteratorRandom; // provides Vec<_>.choose
 
 #[derive(Debug, Clone)]
 pub struct ModelConfig {
+    /// List of models with their providers.
     pub models: Vec<(ModelProvider, Model)>,
+    /// Even if Ollama is not used, we store the host & port here.
+    /// If Ollama is used, this config will be respected during its instantiations.
     pub ollama: OllamaConfig,
+    /// OpenAI API key & its service check implementation.
     pub openai: OpenAIConfig,
 }
 
-impl std::fmt::Display for ModelConfig {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
-        let models_str = self
-            .models
-            .iter()
-            .map(|(provider, model)| format!("{:?}:{}", provider, model))
-            .collect::<Vec<_>>()
-            .join(",");
-        write!(f, "{}", models_str)
-    }
-}
-
 impl ModelConfig {
-    /// Creates a new config with the given list of models.
-    pub fn new(models: Vec<Model>) -> Self {
-        // map models to (provider, model) pairs
-        let models_providers = models
-            .into_iter()
-            .map(|m| (m.clone().into(), m))
-            .collect::<Vec<_>>();
-
-        let mut providers = Vec::new();
-
-        // get ollama models & config
-        let ollama_models = models_providers
-            .iter()
-            .filter_map(|(p, m)| {
-                if *p == ModelProvider::Ollama {
-                    Some(m.clone())
-                } else {
-                    None
-                }
-            })
-            .collect::<Vec<_>>();
-        let ollama_config = if !ollama_models.is_empty() {
-            providers.push(ModelProvider::Ollama);
-            Some(OllamaConfig::new(ollama_models))
-        } else {
-            None
-        };
-
-        // get openai models & config
-        let openai_models = models_providers
-            .iter()
-            .filter_map(|(p, m)| {
-                if *p == ModelProvider::OpenAI {
-                    Some(m.clone())
-                } else {
-                    None
-                }
-            })
-            .collect::<Vec<_>>();
-        let openai_config = if !openai_models.is_empty() {
-            providers.push(ModelProvider::OpenAI);
-            Some(OpenAIConfig::new(openai_models))
-        } else {
-            None
-        };
-
-        Self {
-            models_providers,
-            providers,
-            ollama_config,
-            openai_config,
-        }
-    }
-
     /// Parses Ollama-Workflows compatible models from a comma-separated values string.
-    ///
-    /// ## Example
-    ///
-    /// ```
-    /// let config = ModelConfig::new_from_csv("gpt-4-turbo,gpt-4o-mini");
-    /// ```
     pub fn new_from_csv(input: Option<String>) -> Self {
         let models_str = split_comma_separated(input);
 
@@ -98,7 +30,11 @@ impl ModelConfig {
             })
             .collect::<Vec<_>>();
 
-        Self { models }
+        Self {
+            models,
+            openai: OpenAIConfig::new(),
+            ollama: OllamaConfig::new(),
+        }
     }
 
     /// Returns the models that belong to a given provider from the config.
@@ -117,12 +53,27 @@ impl ModelConfig {
 
     /// Given a raw model name or provider (as a string), returns the first matching model & provider.
     ///
-    /// If this is a model and is supported by this node, it is returned directly.
-    /// If this is a provider, the first matching model in the node config is returned.
+    /// - If input is `*` or `all`, a random model is returned.
+    /// - If input is `!`, the first model is returned.
+    /// - If input is a model and is supported by this node, it is returned directly.
+    /// - If input is a provider, the first matching model in the node config is returned.
     ///
     /// If there are no matching models with this logic, an error is returned.
     pub fn get_matching_model(&self, model_or_provider: String) -> Result<(ModelProvider, Model)> {
-        if let Ok(provider) = ModelProvider::try_from(model_or_provider.clone()) {
+        if model_or_provider == "*" {
+            // return a random model
+            self.models
+                .iter()
+                .choose(&mut rand::thread_rng())
+                .ok_or_else(|| eyre!("No models to randomly pick for '*'."))
+                .cloned()
+        } else if model_or_provider == "!" {
+            // return the first model
+            self.models
+                .first()
+                .ok_or_else(|| eyre!("No models to choose first for '!'."))
+                .cloned()
+        } else if let Ok(provider) = ModelProvider::try_from(model_or_provider.clone()) {
             // this is a valid provider, return the first matching model in the config
             self.models
                 .iter()
@@ -186,6 +137,70 @@ impl ModelConfig {
             unique
         })
     }
+
+    /// Check if the required compute services are running.
+    /// This has several steps:
+    ///
+    /// - If Ollama models are used, hardcoded models are checked locally, and for
+    ///   external models, the workflow is tested with a simple task with timeout.
+    /// - If OpenAI models are used, the API key is checked and the models are tested.
+    ///
+    /// If both types of models are used, both services are checked.
+    /// In the end, bad models are filtered out and we simply check whether we are left with any valid models at all.
+    /// If not, an error is returned.
+    pub async fn check_services(&mut self) -> Result<()> {
+        log::info!("Checking configured services.");
+
+        // TODO: can refactor (provider, model) logic here
+        let unique_providers = self.get_providers();
+
+        let mut good_models = Vec::new();
+
+        // if Ollama is a provider, check that it is running & Ollama models are pulled (or pull them)
+        if unique_providers.contains(&ModelProvider::Ollama) {
+            let ollama_models = self.get_models_for_provider(ModelProvider::Ollama);
+
+            // ensure that the models are pulled / pull them if not
+            let good_ollama_models = self.ollama.check(ollama_models).await?;
+            good_models.extend(
+                good_ollama_models
+                    .into_iter()
+                    .map(|m| (ModelProvider::Ollama, m)),
+            );
+        }
+
+        // if OpenAI is a provider, check that the API key is set
+        if unique_providers.contains(&ModelProvider::OpenAI) {
+            let openai_models = self.get_models_for_provider(ModelProvider::OpenAI);
+
+            let good_openai_models = self.openai.check(openai_models).await?;
+            good_models.extend(
+                good_openai_models
+                    .into_iter()
+                    .map(|m| (ModelProvider::OpenAI, m)),
+            );
+        }
+
+        // update good models
+        if good_models.is_empty() {
+            Err(eyre!("No good models found, please check logs for errors."))
+        } else {
+            self.models = good_models;
+            Ok(())
+        }
+    }
+}
+
+impl std::fmt::Display for ModelConfig {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        let models_str = self
+            .models
+            .iter()
+            .map(|(provider, model)| format!("{:?}:{}", provider, model))
+            .collect::<Vec<_>>()
+            .join(",");
+        write!(f, "{}", models_str)
+    }
 }
 
 #[cfg(test)]
```
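For orientation, a minimal usage sketch of the reworked `ModelConfig` (assuming a tokio runtime; the crate path `dkn_workflows` and the model names are illustrative, not taken from this commit):

```rust
use dkn_workflows::ModelConfig; // hypothetical import path for the workflows subcrate

#[tokio::main]
async fn main() -> eyre::Result<()> {
    // parse models from a comma-separated string, e.g. the DKN_MODELS env var
    let mut config = ModelConfig::new_from_csv(Some("gpt-4-turbo,gpt-4o-mini".to_string()));

    // filter out models whose services are unreachable; errors if none remain
    config.check_services().await?;

    // "*" picks a random model, "!" picks the first; a provider or
    // model name returns the first matching entry in the config
    let (provider, model) = config.get_matching_model("*".to_string())?;
    println!("using {:?}:{}", provider, model);
    Ok(())
}
```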

workflows/src/lib.rs

Lines changed: 6 additions & 20 deletions
```diff
@@ -1,22 +1,8 @@
-use async_trait::async_trait;
-use eyre::Result;
+mod utils;
+pub use utils::*;
 
-mod models;
-pub use models::ModelConfig;
+mod providers;
+pub use providers::*;
 
-/// Ollama configurations & service checks
-mod ollama;
-pub(crate) use ollama::OllamaConfig;
-
-/// OpenAI configurations & service checks
-mod openai;
-pub(crate) use openai::OpenAIConfig;
-
-/// Extension trait for model providers to check if they are ready, and describe themselves.
-#[async_trait]
-pub trait ProvidersExt {
-    const PROVIDER_NAME: &str;
-
-    /// Ensures that the required provider is online & ready.
-    async fn check_service(&self) -> Result<()>;
-}
+mod config;
+pub use config::ModelConfig;
```

workflows/src/providers/mod.rs

Lines changed: 5 additions & 0 deletions
```diff
@@ -0,0 +1,5 @@
+mod ollama;
+pub use ollama::OllamaConfig;
+
+mod openai;
+pub use openai::OpenAIConfig;
```
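Note that `OllamaConfig` and `OpenAIConfig` are now `pub use`d here, whereas the old lib.rs kept them `pub(crate)`; a sketch of what downstream code can now do (crate path illustrative, as above):

```rust
// hypothetical downstream usage; `dkn_workflows` stands in for the actual crate name
use dkn_workflows::{OllamaConfig, OpenAIConfig};

fn main() {
    // both constructors take no arguments, as seen in ModelConfig::new_from_csv above
    let _ollama = OllamaConfig::new(); // host & port config, respected if Ollama is used
    let _openai = OpenAIConfig::new(); // OpenAI API key & its service checks
}
```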
