Milestone 10: whitepaper and research paper publishing

trae · trae · commit ab43d7bb7434 · 2026-03-22T15:34:56.000-04:00
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/Cargo.toml b/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "consensusmind"
-version = "0.9.0"
+version = "0.10.0"
 edition = "2021"
 authors = ["Distributed Systems Labs, LLC"]
 license = "Apache-2.0"
diff --git a/README.md b/README.md
@@ -8,7 +8,7 @@ ConsensusMind is an autonomous research agent that conducts end-to-end research
 
 ## Status
 
-**Current Version:** 0.9.0 - Milestone 9 Complete
+**Current Version:** 0.10.0 - Milestone 10 Complete
 
 ### Completed Milestones
 
@@ -54,9 +54,12 @@ ConsensusMind is an autonomous research agent that conducts end-to-end research
 - Unified CLI entrypoints (help/version and command usage)
 - Repo structure improvements for outputs and data directories
 
+#### Milestone 10: Whitepaper & Research Paper
+- Whitepaper (Markdown) and research paper (LaTeX) generation from hypotheses and experiment results
+
 ## Features
 
-### Current (v0.9.0)
+### Current (v0.10.0)
 - Configuration management from TOML files
 - Environment variable overrides for sensitive data
 - Structured logging to file and console
@@ -73,6 +76,7 @@ ConsensusMind is an autonomous research agent that conducts end-to-end research
 - Consensus simulation and experimentation
 - LaTeX paper generation from experiment outputs
 - CLI help/version and stable command interface
+- Whitepaper and research paper publishing commands (`whitepaper`, `publish`)
 
 ### Planned
 - Automated LaTeX paper generation
@@ -136,13 +140,15 @@ consensusmind run "<query>"
 consensusmind hypothesize "<query>"
 consensusmind experiment <hypothesis-id> [--seeds N] [--ticks T] [--nodes N]
 consensusmind paper <hypothesis-id>
+consensusmind whitepaper <hypothesis-id>
+consensusmind publish <hypothesis-id>
 consensusmind index
 consensusmind semantic-search "<query>" [top_k]
 consensusmind simulate [rounds] [leader_failure_prob] [seed]
 consensusmind raft-simulate [nodes] [ticks] [seed]
 ```
 
-Currently initializes the system, validates configuration, and provides arXiv search and PDF download capabilities.
+The CLI supports end-to-end research runs, hypothesis generation, experiments, and paper/whitepaper generation.
 
 ## Development
 ```bash
@@ -166,7 +172,7 @@ CI runs `cargo fmt --check`, `cargo clippy -- -D warnings`, and `cargo test` on
 - [x] Milestone 7: Automated Experimentation
 - [x] Milestone 8: Paper Generation
 - [x] Milestone 9: Integration & Polish
-- [ ] Milestone 10: Whitepaper & Research Paper
+- [x] Milestone 10: Whitepaper & Research Paper
 
 ## License
 
diff --git a/src/agent/mod.rs b/src/agent/mod.rs
@@ -239,6 +239,37 @@ impl Agent {
         crate::output::paper::write_paper_tex(&self.config.paths.output, &hypothesis, &run, &store)
     }
 
+    /// Generates the Markdown whitepaper for a stored hypothesis.
+    ///
+    /// Looks up `hypothesis_id` in the configured hypotheses file, loads that hypothesis's
+    /// experiment results from the configured experiments directory, opens the metadata store,
+    /// and passes all three to the whitepaper writer together with the configured output path.
+    ///
+    /// # Errors
+    ///
+    /// Propagates the first failure from any of those steps.
+    pub fn whitepaper(
+        &self,
+        hypothesis_id: &str,
+    ) -> Result<crate::output::whitepaper::SavedWhitepaper> {
+        use crate::output::whitepaper::{load_experiment_results, write_whitepaper_md};
+
+        let knowledge = &self.config.knowledge;
+        let paths = &self.config.paths;
+
+        let hypothesis = experiment::find_hypothesis(&knowledge.hypotheses_file, hypothesis_id)?;
+        let run = load_experiment_results(&paths.experiments, hypothesis_id)?;
+        let store = MetadataStore::new(knowledge.metadata_file.clone())?;
+        write_whitepaper_md(&paths.output, &hypothesis, &run, &store)
+    }
+
+    /// Generates both publication artifacts for one hypothesis.
+    ///
+    /// Runs [`Self::paper`] first and [`Self::whitepaper`] second, stopping at the first
+    /// error; on success the results are returned in that order as `(paper, whitepaper)`.
+    pub fn publish(
+        &self,
+        hypothesis_id: &str,
+    ) -> Result<(
+        crate::output::paper::SavedPaper,
+        crate::output::whitepaper::SavedWhitepaper,
+    )> {
+        // Tuple fields are evaluated left to right, so the paper is still produced first.
+        Ok((self.paper(hypothesis_id)?, self.whitepaper(hypothesis_id)?))
+    }
+
     async fn hypothesize_inner(&mut self, query: &str) -> Result<SavedReport> {
         let max_results = (self.config.agent.max_iterations as usize).clamp(1, 10);
         let download_limit = self.config.agent.download_limit;
diff --git a/src/main.rs b/src/main.rs
@@ -19,6 +19,8 @@ fn print_usage() {
     println!("  consensusmind hypothesize \"<query>\"");
     println!("  consensusmind experiment <hypothesis-id> [--seeds N] [--ticks T] [--nodes N]");
     println!("  consensusmind paper <hypothesis-id>");
+    println!("  consensusmind whitepaper <hypothesis-id>");
+    println!("  consensusmind publish <hypothesis-id>");
     println!("  consensusmind index");
     println!("  consensusmind semantic-search \"<query>\" [top_k]");
     println!("  consensusmind simulate [rounds] [leader_failure_prob] [seed]");
@@ -185,6 +187,29 @@ async fn main() -> Result<()> {
             println!("Paper TeX saved to {}", paper.tex_path.display());
             return Ok(());
         }
+        Some("whitepaper") => {
+            let hypothesis_id = args.get(2).map(|s| s.as_str()).unwrap_or("");
+            if hypothesis_id.trim().is_empty() {
+                println!("Usage: consensusmind whitepaper <hypothesis-id>");
+                return Ok(());
+            }
+            let agent = Agent::new(config)?;
+            let whitepaper = agent.whitepaper(hypothesis_id)?;
+            println!("Whitepaper saved to {}", whitepaper.md_path.display());
+            return Ok(());
+        }
+        Some("publish") => {
+            let hypothesis_id = args.get(2).map(|s| s.as_str()).unwrap_or("");
+            if hypothesis_id.trim().is_empty() {
+                println!("Usage: consensusmind publish <hypothesis-id>");
+                return Ok(());
+            }
+            let agent = Agent::new(config)?;
+            let (paper, whitepaper) = agent.publish(hypothesis_id)?;
+            println!("Paper TeX saved to {}", paper.tex_path.display());
+            println!("Whitepaper saved to {}", whitepaper.md_path.display());
+            return Ok(());
+        }
         Some("simulate") => {
             let rounds = args
                 .get(2)
diff --git a/src/output/mod.rs b/src/output/mod.rs
@@ -5,6 +5,7 @@ use std::fs;
 use std::path::{Path, PathBuf};
 
 pub mod paper;
+pub mod whitepaper;
 
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct AgentRunReport {
diff --git a/src/output/whitepaper.rs b/src/output/whitepaper.rs
@@ -0,0 +1,211 @@
+use crate::agent::experiment::ExperimentRun;
+use crate::agent::hypothesis::Hypothesis;
+use crate::knowledge::database::MetadataStore;
+use anyhow::{Context, Result};
+use chrono::Utc;
+use serde::{Deserialize, Serialize};
+use std::cmp::Ordering;
+use std::fs;
+use std::path::{Path, PathBuf};
+
+/// Result of writing a whitepaper to disk.
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct SavedWhitepaper {
+    /// Path of the Markdown file produced by [`write_whitepaper_md`].
+    pub md_path: PathBuf,
+}
+
+/// Renders the whitepaper for `hypothesis` and saves it under `<output_root>/papers`.
+///
+/// The file is named `whitepaper-<sanitized hypothesis id>-<UTC timestamp>.md`, where the
+/// timestamp uses the `%Y%m%dT%H%M%SZ` layout. The `papers` directory is created when missing.
+///
+/// # Errors
+///
+/// Fails if the directory cannot be created, if rendering fails, or if `atomic_write`
+/// reports an error.
+pub fn write_whitepaper_md(
+    output_root: &Path,
+    hypothesis: &Hypothesis,
+    experiment_run: &ExperimentRun,
+    metadata_store: &MetadataStore,
+) -> Result<SavedWhitepaper> {
+    let target_dir = output_root.join("papers");
+    fs::create_dir_all(&target_dir)?;
+
+    let stamp = Utc::now().format("%Y%m%dT%H%M%SZ").to_string();
+    let safe_id = sanitize_filename(&hypothesis.id);
+    let md_path = target_dir.join(format!("whitepaper-{}-{}.md", safe_id, stamp));
+
+    let body = render_md(hypothesis, experiment_run, metadata_store)?;
+    crate::utils::fs::atomic_write(&md_path, body.as_bytes())?;
+    Ok(SavedWhitepaper { md_path })
+}
+
+/// Loads the stored experiment run for `hypothesis_id`.
+///
+/// The run is read from `<experiments_root>/<hypothesis_id>/results.json` and deserialized
+/// from JSON.
+///
+/// # Errors
+///
+/// Returns an error naming the results file when it cannot be read or when its contents do
+/// not deserialize into an [`ExperimentRun`].
+pub fn load_experiment_results(
+    experiments_root: &Path,
+    hypothesis_id: &str,
+) -> Result<ExperimentRun> {
+    let path = experiments_root.join(hypothesis_id).join("results.json");
+    let contents = fs::read_to_string(&path)
+        .with_context(|| format!("Failed to read experiment results: {}", path.display()))?;
+    // Attach the path to parse failures too, so a malformed file is as easy to locate as a
+    // missing one.
+    serde_json::from_str(&contents)
+        .with_context(|| format!("Failed to parse experiment results: {}", path.display()))
+}
+
+/// Builds the whitepaper body as a Markdown string.
+///
+/// Sections appear in this order: title, abstract, hypothesis mechanism, evaluation plan,
+/// experiments, related work, and reproducibility. The evaluation plan and the two experiment
+/// subsections are omitted when their source lists are empty. Raft cases are ranked by
+/// descending mean commit rate per tick and only the first five are listed.
+fn render_md(
+    hypothesis: &Hypothesis,
+    experiment_run: &ExperimentRun,
+    metadata_store: &MetadataStore,
+) -> Result<String> {
+    use std::fmt::Write as _;
+
+    let mut doc = String::new();
+
+    writeln!(doc, "# {}\n", hypothesis.title)?;
+    writeln!(doc, "## Abstract\n{}\n", hypothesis.description)?;
+    writeln!(doc, "## Hypothesis\n**Mechanism.** {}\n", hypothesis.mechanism)?;
+
+    if !hypothesis.evaluation_plan.is_empty() {
+        doc.push_str("## Evaluation Plan\n");
+        for (number, step) in (1usize..).zip(&hypothesis.evaluation_plan) {
+            writeln!(doc, "{}. {}", number, step)?;
+        }
+        doc.push('\n');
+    }
+
+    doc.push_str("## Experiments\n");
+    doc.push_str("Experiments are executed as parameter sweeps over simulation configurations with multiple random seeds. This report summarizes aggregate metrics.\n\n");
+
+    if !experiment_run.raft.is_empty() {
+        // Rank references rather than copies; the sort is stable, so ties keep input order.
+        let mut ranked: Vec<_> = experiment_run.raft.iter().collect();
+        ranked.sort_by(|lhs, rhs| {
+            rhs.aggregate
+                .mean_commit_rate_per_tick
+                .partial_cmp(&lhs.aggregate.mean_commit_rate_per_tick)
+                .unwrap_or(Ordering::Equal)
+        });
+
+        doc.push_str("### Raft-style Simulator (Top Cases)\n");
+        for case in ranked.iter().take(5) {
+            let (params, stats) = (&case.params, &case.aggregate);
+            writeln!(
+                doc,
+                "- nodes={} ticks={} p_req={:.2} mean_commit_rate_per_tick={:.6} mean_elections={:.2} mean_leader_changes={:.2}",
+                params.nodes,
+                params.ticks,
+                params.client_request_prob,
+                stats.mean_commit_rate_per_tick,
+                stats.mean_elections,
+                stats.mean_leader_changes
+            )?;
+        }
+        doc.push('\n');
+    }
+
+    if !experiment_run.leader.is_empty() {
+        doc.push_str("### Leader-failure Baseline\n");
+        for case in &experiment_run.leader {
+            writeln!(
+                doc,
+                "- p_fail={:.2} mean_commit_rate={:.4}",
+                case.params.leader_failure_prob, case.aggregate.mean_commit_rate
+            )?;
+        }
+        doc.push('\n');
+    }
+
+    doc.push_str("## Related Work\n");
+    if hypothesis.related_paper_ids.is_empty() {
+        doc.push_str("No related papers were explicitly linked to this hypothesis.\n\n");
+    } else {
+        for id in &hypothesis.related_paper_ids {
+            // Fall back to the raw identifier when the store has no entry for this paper.
+            let title = metadata_store
+                .get_paper(id)
+                .map_or_else(|| id.to_string(), |paper| paper.title.clone());
+            writeln!(doc, "- {} (arXiv: {}) https://arxiv.org/abs/{}", title, id, id)?;
+        }
+        doc.push('\n');
+    }
+
+    // NOTE(review): the results path below is a fixed `data/experiments/...` string, not the
+    // experiments directory the loader is given; confirm the two always agree.
+    writeln!(doc, "## Reproducibility")?;
+    writeln!(doc, "- Results file: `data/experiments/{}/results.json`", hypothesis.id)?;
+    writeln!(doc, "- Generated at: {}", Utc::now().to_rfc3339())?;
+
+    Ok(doc)
+}
+
+/// Replaces every character other than ASCII letters, ASCII digits, `-` and `_` with `_`.
+///
+/// Each input character maps to exactly one output character, so the result has the same
+/// number of characters as `s`.
+fn sanitize_filename(s: &str) -> String {
+    let mut cleaned = String::with_capacity(s.len());
+    for ch in s.chars() {
+        let allowed = ch.is_ascii_alphanumeric() || matches!(ch, '-' | '_');
+        cleaned.push(if allowed { ch } else { '_' });
+    }
+    cleaned
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::agent::experiment::{run_experiments, ExperimentOverrides};
+
+    /// Builds a scratch directory path under the system temp directory, made distinct by the
+    /// process id and the current timestamp in nanoseconds.
+    fn temp_path(name: &str) -> PathBuf {
+        let pid = std::process::id();
+        let ts = Utc::now().timestamp_nanos_opt().unwrap_or(0);
+        std::env::temp_dir().join(format!("consensusmind-whitepaper-{}-{}-{}", name, pid, ts))
+    }
+
+    /// Runs a small experiment sweep, renders the whitepaper from it, and inspects the file
+    /// that lands on disk.
+    #[test]
+    fn write_whitepaper_creates_md_file() {
+        let root = temp_path("write");
+        fs::create_dir_all(&root).unwrap();
+
+        let hypotheses_path = root.join("hypotheses.json");
+        let metadata_path = root.join("metadata.json");
+        let output_root = root.join("out");
+        fs::create_dir_all(&output_root).unwrap();
+
+        let h = Hypothesis {
+            id: "h1".to_string(),
+            title: "Whitepaper Title".to_string(),
+            description: "desc".to_string(),
+            mechanism: "mech".to_string(),
+            evaluation_plan: vec!["plan".to_string()],
+            related_paper_ids: vec!["1234.56789".to_string()],
+            novelty_score: 0.2,
+            feasibility_score: 0.8,
+            created_at: Utc::now().to_rfc3339(),
+        };
+        let h_contents = serde_json::to_string_pretty(&vec![h.clone()]).unwrap();
+        crate::utils::fs::atomic_write(&hypotheses_path, h_contents.as_bytes()).unwrap();
+
+        crate::utils::fs::atomic_write(&metadata_path, "{}".as_bytes()).unwrap();
+        let store = MetadataStore::new(metadata_path).unwrap();
+
+        let (_hyp, run, _results_path) = run_experiments(
+            &root,
+            &hypotheses_path,
+            "h1",
+            ExperimentOverrides {
+                seeds: Some(2),
+                ticks: Some(200),
+                nodes: Some(3),
+            },
+        )
+        .unwrap();
+
+        let saved = write_whitepaper_md(&output_root, &h, &run, &store).unwrap();
+        assert!(saved.md_path.exists());
+        let contents = fs::read_to_string(&saved.md_path).unwrap();
+        assert!(contents.contains("# Whitepaper Title"));
+        assert!(contents.contains("## Experiments"));
+        // A linked paper is always listed with its arXiv URL, whether or not the store
+        // knows its title.
+        assert!(contents.contains("https://arxiv.org/abs/1234.56789"));
+
+        // Best-effort cleanup so repeated runs do not pile up scratch directories; a failed
+        // assertion above skips this and leaves the files in place for inspection.
+        let _ = fs::remove_dir_all(&root);
+    }
+}