|
use anyhow::{Context, Result};
use clap::Parser;
use harald::ingest::embed;
use harald::ingest::{run_with_config, IngestConfig};
use reqwest::Client;
use serde_json::Value;
use std::fs;
use std::path::{Path, PathBuf};
4 | 9 |
|
// Command-line arguments for the MarvelAI ingest tool.
//
// NOTE: the `///` doc comments on each field double as clap's --help
// text, so they are part of the program's runtime output — do not
// rewrite them casually.
#[derive(Parser, Debug)]
#[command(author, version, about = "MarvelAI Marvel Ingest Tool", long_about = None)]
struct Args {
    /// Path to the MarvelAIs.json file
    #[arg(
        short,
        long,
        default_value = "personality-archetypes/pop-culture/marvel/MarvelAIs.json"
    )]
    input: PathBuf,

    /// Maximum characters to read per file
    // Forwarded to IngestConfig::max_chars.
    #[arg(long, default_value_t = 800)]
    max_chars: usize,

    /// Maximum tokens for embedding requests
    // Forwarded to IngestConfig::max_tokens and to the API probe.
    #[arg(long, default_value_t = 600)]
    max_tokens: usize,

    /// Maximum number of files to process concurrently
    // None defers the concurrency choice to run_with_config —
    // TODO(review): confirm what default that applies.
    #[arg(long)]
    max_concurrent_files: Option<usize>,
}
21 | 33 |
|
22 | 34 | #[tokio::main] |
23 | | -async fn main() { |
| 35 | +async fn main() -> Result<()> { |
24 | 36 | let args = Args::parse(); |
| 37 | + |
| 38 | + println!("=================================================="); |
| 39 | + println!("🚀 HARALD MARVELAI INGEST (Rust)"); |
| 40 | + println!("🔍 Processing MarvelAIs.json using JSONL format"); |
| 41 | + println!("=================================================="); |
| 42 | + |
| 43 | + // Verify input file exists |
| 44 | + if !args.input.exists() { |
| 45 | + eprintln!("❌ Input file not found: {}", args.input.display()); |
| 46 | + std::process::exit(1); |
| 47 | + } |
| 48 | + |
| 49 | + // Test embedding API first - exit early if it fails |
| 50 | + let client = Client::builder() |
| 51 | + .timeout(std::time::Duration::from_secs(10)) // Reduced from 30 to 10 seconds |
| 52 | + .build() |
| 53 | + .context("Failed to create HTTP client")?; |
| 54 | + |
| 55 | + println!("Testing embedding API with model harald-phi4"); |
| 56 | + |
| 57 | + // Test with a simple string first |
| 58 | + match test_embedding_api(&client, args.max_tokens).await { |
| 59 | + Ok(_) => println!(" ✅ Embedding API test successful"), |
| 60 | + Err(e) => { |
| 61 | + eprintln!(" ❌ Embedding API test failed: {}", e); |
| 62 | + eprintln!( |
| 63 | + "❌ Cannot proceed without working embedding API. Please check Ollama is running." |
| 64 | + ); |
| 65 | + std::process::exit(1); |
| 66 | + } |
| 67 | + } |
| 68 | + |
| 69 | + // Convert JSON to JSONL if needed |
| 70 | + let jsonl_path = prepare_jsonl_input(&args.input)?; |
| 71 | + |
| 72 | + // Create a temporary directory for processing |
| 73 | + let temp_dir = tempfile::TempDir::new().context("Failed to create temporary directory")?; |
| 74 | + |
| 75 | + // Copy JSONL to temp directory |
| 76 | + let temp_jsonl = temp_dir.path().join("MarvelAIs.jsonl"); |
| 77 | + fs::copy(&jsonl_path, &temp_jsonl).context("Failed to copy JSONL to temp directory")?; |
| 78 | + |
| 79 | + // Configure ingestion to use the temp directory |
25 | 80 | let config = IngestConfig { |
26 | | - root_dir: args.root_dir, |
| 81 | + root_dir: temp_dir.path().to_path_buf(), |
27 | 82 | max_chars: args.max_chars, |
28 | 83 | max_tokens: args.max_tokens, |
29 | 84 | max_concurrent_files: args.max_concurrent_files, |
30 | 85 | }; |
| 86 | + |
| 87 | + // Run the standard harald_ingest logic |
31 | 88 | match run_with_config(config).await { |
32 | | - Ok(_) => println!("MarvelAI ingest completed successfully."), |
33 | | - Err(e) => eprintln!("MarvelAI ingest failed: {}", e), |
| 89 | + Ok(stats) => { |
| 90 | + println!("✅ MarvelAI ingest completed successfully!"); |
| 91 | + println!("📁 Processed: {} files", stats.files_processed); |
| 92 | + println!("⏭️ Skipped: {} files", stats.files_skipped); |
| 93 | + println!("💾 Output: {}", stats.output_dir.display()); |
| 94 | + } |
| 95 | + Err(e) => { |
| 96 | + eprintln!("❌ MarvelAI ingest failed: {}", e); |
| 97 | + std::process::exit(1); |
| 98 | + } |
| 99 | + } |
| 100 | + |
| 101 | + Ok(()) |
| 102 | +} |
| 103 | + |
| 104 | +/// Test the embedding API with a simple request to ensure it's working |
| 105 | +async fn test_embedding_api(client: &Client, max_tokens: usize) -> Result<()> { |
| 106 | + let test_text = "test"; |
| 107 | + |
| 108 | + // Create a fast-fail config for testing - using localhost endpoint as recommended |
| 109 | + let test_config = embed::EmbedConfig { |
| 110 | + model: "harald-phi4".to_string(), |
| 111 | + endpoint: "http://localhost:11434/api/embeddings".to_string(), |
| 112 | + timeout_secs: 15, // Longer timeout to account for model loading |
| 113 | + max_retries: 2, // Allow 2 attempts for initial API warmup |
| 114 | + }; |
| 115 | + |
| 116 | + println!(" Testing: embedding '{}' (using {})", test_text, test_config.endpoint); |
| 117 | + println!(" Model warmup may take a moment on first request..."); |
| 118 | + |
| 119 | + match embed::embed_with_config(test_text, max_tokens, client, test_config).await { |
| 120 | + Ok(embedding) => { |
| 121 | + if embedding.is_empty() { |
| 122 | + return Err(anyhow::anyhow!("Received empty embedding vector")); |
| 123 | + } |
| 124 | + println!(" ✅ Embedding vectors received successfully ({} dimensions)", embedding.len()); |
| 125 | + Ok(()) |
| 126 | + } |
| 127 | + Err(e) => { |
| 128 | + println!(" ❌ Request failed: {}", e); |
| 129 | + |
| 130 | + // Provide helpful debugging information |
| 131 | + eprintln!(" 💡 Troubleshooting tips:"); |
| 132 | + eprintln!(" • Ensure 'ollama serve' is running in a terminal"); |
| 133 | + eprintln!(" • Verify harald-phi4 model is available: ollama list"); |
| 134 | + eprintln!(" • Check API endpoint: curl http://localhost:11434/api/version"); |
| 135 | + |
| 136 | + Err(anyhow::anyhow!( |
| 137 | + "Failed to generate embeddings with harald-phi4 model (fast test failed)" |
| 138 | + )) |
| 139 | + } |
| 140 | + } |
| 141 | +} |
| 142 | + |
| 143 | +/// Prepare JSONL input file from the MarvelAIs.json file |
| 144 | +fn prepare_jsonl_input(input_path: &PathBuf) -> Result<PathBuf> { |
| 145 | + // If it's already JSONL, return as-is |
| 146 | + if input_path.extension().and_then(|s| s.to_str()) == Some("jsonl") { |
| 147 | + return Ok(input_path.clone()); |
34 | 148 | } |
| 149 | + |
| 150 | + // Read and parse JSON file |
| 151 | + let json_content = fs::read_to_string(input_path) |
| 152 | + .with_context(|| format!("Failed to read JSON file: {}", input_path.display()))?; |
| 153 | + |
| 154 | + let json_value: Value = serde_json::from_str(&json_content) |
| 155 | + .with_context(|| format!("Failed to parse JSON file: {}", input_path.display()))?; |
| 156 | + |
| 157 | + // Create JSONL output path |
| 158 | + let mut jsonl_path = input_path.clone(); |
| 159 | + jsonl_path.set_extension("jsonl"); |
| 160 | + |
| 161 | + // Convert to JSONL |
| 162 | + let jsonl_content = match json_value { |
| 163 | + Value::Array(items) => { |
| 164 | + // Array of objects - convert each to a line |
| 165 | + items |
| 166 | + .iter() |
| 167 | + .map(|item| serde_json::to_string(item)) |
| 168 | + .collect::<Result<Vec<_>, _>>() |
| 169 | + .context("Failed to serialize JSON items")? |
| 170 | + .join("\n") |
| 171 | + } |
| 172 | + _ => { |
| 173 | + // Single object - just one line |
| 174 | + serde_json::to_string(&json_value).context("Failed to serialize JSON object")? |
| 175 | + } |
| 176 | + }; |
| 177 | + |
| 178 | + // Write JSONL file |
| 179 | + fs::write(&jsonl_path, &jsonl_content) |
| 180 | + .with_context(|| format!("Failed to write JSONL file: {}", jsonl_path.display()))?; |
| 181 | + |
| 182 | + let line_count = jsonl_content.lines().count(); |
| 183 | + println!( |
| 184 | + "Converting \"{}\" to JSONL at \"{}\"", |
| 185 | + input_path.display(), |
| 186 | + jsonl_path.display() |
| 187 | + ); |
| 188 | + println!("✅ JSONL conversion complete: {} lines", line_count); |
| 189 | + |
| 190 | + Ok(jsonl_path) |
35 | 191 | } |
0 commit comments