|
| 1 | +use candle_core::{Error, Tensor}; |
| 2 | + |
| 3 | +use crate::math::tensors::Matrix; |
| 4 | + |
/// The activation functions supported by this crate.
///
/// All variants are applied element-wise except [`Activations::Softmax`],
/// which normalizes along the last dimension (rows of a rank-2 `Matrix`).
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum Activations {
    /// Heaviside step: 1 where x >= 0, else 0.
    Step,
    /// Identity: passes the input through unchanged.
    Linear,
    /// Logistic sigmoid: 1 / (1 + exp(-x)).
    Sigmoid,
    /// Hyperbolic tangent.
    Tanh,
    /// Rectified linear unit: max(0, x).
    ReLU,
    /// Row-wise softmax: exp(x_i) / sum_j exp(x_j).
    Softmax,
    /// Swish (SiLU): x * sigmoid(x).
    Swish,
    /// Gaussian error linear unit: 0.5 * x * (1 + erf(x / sqrt(2))).
    GeLU,
    /// Cardinal sine: sin(x) / x, with sinc(0) = 1.
    Sinc,
    /// Scaled exponential linear unit (self-normalizing networks).
    SeLU,
}
| 17 | + |
| 18 | +impl Activations { |
| 19 | + pub fn activate(&self, input: Matrix) -> Result<Matrix, Error> { |
| 20 | + let tensor = input.inner(); |
| 21 | + let device = input.device.clone(); |
| 22 | + let dtype = input.dtype; |
| 23 | + |
| 24 | + let activated = match self { |
| 25 | + Activations::Step => { |
| 26 | + // Heaviside step function: 1.0 where x >= 0.0, else 0.0 |
| 27 | + let zeros = Tensor::zeros_like(tensor)?; |
| 28 | + let ones = Tensor::ones_like(tensor)?; |
| 29 | + tensor.ge(&zeros)?.where_cond(&ones, &zeros)? |
| 30 | + } |
| 31 | + Activations::Linear => tensor.clone(), |
| 32 | + Activations::Tanh => tensor.tanh()?, |
| 33 | + Activations::ReLU => tensor.relu()?, |
| 34 | + Activations::Sinc => { |
| 35 | + // sinc(x) = sin(x) / x, define 1 at x=0 |
| 36 | + // Using a small epsilon to handle division by zero. |
| 37 | + // If x is near zero, output 1, else sin(x)/x |
| 38 | + let eps_val = 1e-7f64; |
| 39 | + let eps = Tensor::full(eps_val, tensor.dims(), &device)?.to_dtype(dtype)?; |
| 40 | + let near_zero = tensor.abs()?.le(&eps)?; |
| 41 | + |
| 42 | + let numerator = tensor.sin()?; |
| 43 | + let denominator = tensor.clone(); // Clone to avoid consuming tensor |
| 44 | + let value = numerator.div(&denominator)?; |
| 45 | + |
| 46 | + near_zero.where_cond(&Tensor::ones_like(tensor)?, &value)? |
| 47 | + } |
| 48 | + Activations::Sigmoid => { |
| 49 | + // Sigmoid(x) = 1 / (1 + exp(-x)) |
| 50 | + let neg_x = tensor.neg()?; |
| 51 | + let exp_neg_x = neg_x.exp()?; |
| 52 | + let one = Tensor::ones_like(&exp_neg_x)?; |
| 53 | + let one_plus_exp_neg_x = one.add(&exp_neg_x)?; |
| 54 | + one_plus_exp_neg_x.recip()? // 1 / (1 + exp(-x)) |
| 55 | + } |
| 56 | + Activations::Softmax => { |
| 57 | + // Softmax(x_i) = exp(x_i) / sum(exp(x_j)) along the last dimension |
| 58 | + // For a Matrix (rank 2), apply along dim 1 (columns) for each row. |
| 59 | + let exp_x = tensor.exp()?; |
| 60 | + // Sum along the last dimension, keeping the dimension for broadcasting |
| 61 | + let sum_exp_x = exp_x.sum_keepdim(1)?; |
| 62 | + exp_x.broadcast_div(&sum_exp_x)? |
| 63 | + } |
| 64 | + Activations::Swish => { |
| 65 | + // Swish(x) = x * Sigmoid(x) |
| 66 | + let neg_x = tensor.neg()?; |
| 67 | + let exp_neg_x = neg_x.exp()?; |
| 68 | + let one = Tensor::ones_like(&exp_neg_x)?; |
| 69 | + let one_plus_exp_neg_x = one.add(&exp_neg_x)?; |
| 70 | + let sigmoid_x = one_plus_exp_neg_x.recip()?; |
| 71 | + tensor.mul(&sigmoid_x)? |
| 72 | + } |
| 73 | + Activations::GeLU => { |
| 74 | + // GeLU(x) = 0.5 * x * (1 + erf(x / sqrt(2))) |
| 75 | + let sqrt_two_val = 2.0f64.sqrt(); |
| 76 | + let sqrt_two = |
| 77 | + Tensor::full(sqrt_two_val, tensor.dims(), &device)?.to_dtype(dtype)?; |
| 78 | + |
| 79 | + let x_div_sqrt_two = tensor.div(&sqrt_two)?; |
| 80 | + let erf_val = x_div_sqrt_two.erf()?; |
| 81 | + let one = Tensor::ones_like(&erf_val)?; |
| 82 | + let one_plus_erf = one.add(&erf_val)?; |
| 83 | + |
| 84 | + let half_val = 0.5f64; |
| 85 | + let half = Tensor::full(half_val, tensor.dims(), &device)?.to_dtype(dtype)?; |
| 86 | + |
| 87 | + tensor.mul(&half)?.mul(&one_plus_erf)? |
| 88 | + } |
| 89 | + Activations::SeLU => { |
| 90 | + // SeLU(x) = lambda * (x if x > 0 else alpha * (exp(x) - 1)) |
| 91 | + // Standard constants for SeLU |
| 92 | + let alpha_val = 1.673_263_242_354_377_2_f64; |
| 93 | + let lambda_val = 1.050_700_987_355_480_5_f64; |
| 94 | + |
| 95 | + let alpha = Tensor::full(alpha_val, tensor.dims(), &device)?.to_dtype(dtype)?; |
| 96 | + let lambda = Tensor::full(lambda_val, tensor.dims(), &device)?.to_dtype(dtype)?; |
| 97 | + let zero = Tensor::zeros_like(tensor)?; |
| 98 | + |
| 99 | + // Condition: x > 0 |
| 100 | + let cond_gt_zero = tensor.gt(&zero)?; |
| 101 | + |
| 102 | + // Case for x > 0: just x |
| 103 | + let case_gt_zero = tensor.clone(); |
| 104 | + |
| 105 | + // Case for x <= 0: alpha * (exp(x) - 1) |
| 106 | + let exp_x = tensor.exp()?; |
| 107 | + let one_for_sub = Tensor::ones_like(&exp_x)?; |
| 108 | + let exp_x_minus_one = exp_x.sub(&one_for_sub)?; |
| 109 | + let case_le_zero = alpha.mul(&exp_x_minus_one)?; |
| 110 | + |
| 111 | + let result = cond_gt_zero.where_cond(&case_gt_zero, &case_le_zero)?; |
| 112 | + lambda.mul(&result)? |
| 113 | + } |
| 114 | + }; |
| 115 | + |
| 116 | + Matrix::new(activated, device, dtype) |
| 117 | + } |
| 118 | +} |
0 commit comments