@@ -264,7 +264,8 @@ def objective(x):
         mse = np.sum((A - reconstruction) ** 2)
 
         # Regularization: L1 penalty on both W and H
-        l1_W = alpha * np.sum(np.abs(W))
+        # Exclude diagonal of W from L1 penalty
+        l1_W = alpha * np.sum(np.abs(W)) - alpha * np.diag(np.abs(W)).sum()
         l1_H = alpha * np.sum(np.abs(H))
 
         total_loss = mse + l1_W + l1_H
@@ -273,7 +274,7 @@ def objective(x):
         if total_loss < best_loss[0]:
             best_loss[0] = total_loss
 
-        if iteration_counter[0] % 100 == 0:
+        if iteration_counter[0] % 10 == 0:
             print(
                 f"  Iter {iteration_counter[0]}: Loss={total_loss:.4f} "
                 f"(MSE={mse:.4f}, L1_W={l1_W:.4f}, L1_H={l1_H:.4f})"
@@ -287,24 +288,20 @@ def gradient(x):
 
         # ===== Gradient w.r.t. W =====
         # 1. Reconstruction term: ∂/∂W [||A - WH||²] = 2(error @ H^T), L1 penalty: ∂/∂W [α||W||₁] = α * sign(W)
-        grad_W = 2 * ((W @ H - A) @ H.T) + alpha
+        grad_W = 2 * ((W @ H - A) @ H.T) + alpha * np.sign(W) - np.diag(alpha * np.sign(np.diag(W)))
 
         # ===== Gradient w.r.t. H =====
         # 1. Reconstruction term: ∂/∂H [||A - WH||²] = 2(W^T @ error), L1 penalty: ∂/∂H [α||H||₁] = α * sign(H)
-        grad_H = 2 * (W.T @ (W @ H - A)) + alpha
+        grad_H = 2 * (W.T @ (W @ H - A)) + alpha * np.sign(H)
 
         return np.concatenate([grad_W.ravel(), grad_H.ravel()])
 
-    # Enforce non-negativity
-    bounds = [(0, None)] * len(x0)
-
     print("\nStarting optimization...")
 
     result = minimize(
         fun=objective,
         x0=x0,
         method="L-BFGS-B",
-        bounds=bounds,
         jac=gradient,
         options={"maxiter": max_iter, "disp": True},
     )