DessimozLab
diff --git a/foldtree2/notebooks/experiments/test_fapeloss.ipynb b/foldtree2/notebooks/experiments/test_fapeloss.ipynb
Lines changed: 195 additions & 61 deletions
@@ -2,7 +2,7 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 1,
    "id": "59ee2444",
    "metadata": {},
    "outputs": [
@@ -20,7 +20,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 2,
    "id": "10fe5139",
    "metadata": {},
    "outputs": [],
@@ -89,29 +89,34 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 39,
+   "execution_count": 3,
    "id": "4c3ff08e",
    "metadata": {},
    "outputs": [],
    "source": [
     "import torch\n",
     "from foldtree2.src.pdbgraph import PDB2PyG\n",
-    "from foldtree2.src.rigid_utils import *\n",
+    "from foldtree2.src.rigid_utils import Rigid\n",
+    "from foldtree2.src.losses.fape import (\n",
+    "    compute_chain_positions,\n",
+    "    rotation_matrix_to_quaternion,\n",
+    "    reconstruct_positions,\n",
+    "    quaternion_multiply,\n",
+    "    quaternion_rotate,\n",
+    "    fape_loss,\n",
+    "    lddt_loss,\n",
+    "    compute_lddt_quaternions\n",
+    ")\n",
     "\n",
     "import matplotlib.pyplot as plt\n",
     "from mpl_toolkits.mplot3d import Axes3D\n",
-    "from foldtree2.src.losses.losses import compute_chain_positions\n",
-    "\n",
-    "# Example PDB file path\n",
-    "pdb_path = './foldtree2/config/1eei.pdb'\n",
-    "\n",
-    "# Initialize parser\n",
-    "pdb2pyg = PDB2PyG(aapropcsv = 'foldtree2/config/aaindex1.csv')\n"
+    "import numpy as np\n",
+    "from scipy.spatial import procrustes"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 42,
+   "execution_count": 4,
    "id": "63373b61",
    "metadata": {},
    "outputs": [],
@@ -234,8 +239,7 @@
     "\t# Stack into tensors\n",
     "\tif rotations:\n",
     "\t\trotation_tensor = torch.stack(rotations, dim=0)\n",
-    "\t\t#normalize rotation matrices to ensure orthogonality\n",
-    "\t\trotation_tensor = rotation_tensor / rotation_tensor.norm(dim=[1, 2], keepdim=True)\n",
+    "\t\t# Rotation matrices from Rigid.get_rots() are already orthogonal; dividing by the Frobenius norm (sqrt(3) for a rotation) would break that, so no normalization is applied.\n",
     "\telse:\n",
     "\t\trotation_tensor = torch.empty(0, 3, 3)\n",
     "\t\n",
@@ -245,7 +249,7 @@
     "\t\ttranslation_tensor = torch.empty(0, 3)\n",
     "\tif quats:\n",
     "\t\tquats = torch.stack(quats, dim=0)\n",
-    "\t\t#normalize quaternion vectors\n",
+    "\t\t# Normalize quaternion vectors to ensure unit norm\n",
     "\t\tquats = quats / quats.norm(dim=1, keepdim=True)\n",
     "\telse:\n",
     "\t\tquats = torch.empty(0, 4)\n",
@@ -372,8 +376,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 43,
-   "id": "48e0d8f9",
+   "execution_count": 5,
+   "id": "d5f32f57",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Transform a structure's residues into rigid-body transforms\n",
+    "from Bio.PDB import PDBParser\n",
+    "pdb_parser = PDBParser(QUIET=True)\n",
+    "\n",
+    "pdb_path = './foldtree2/config/1eei.pdb'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "635676ab",
    "metadata": {},
    "outputs": [
     {
@@ -485,17 +503,15 @@
       "        [ 0.5021,  0.2582, -0.7162,  0.4102]])\n",
       "Transformation Analysis:\n",
       "  Number of residue-to-residue transformations: 102\n",
-      "  Mean rotation angle: 120.00° ± 15.96°\n",
+      "  Mean rotation angle: 123.56° ± 31.83°\n",
       "  Mean translation distance: 57.890 ± 17.816 Å\n",
       "  Translation distance range: 10.431 - 98.682 Å\n",
-      "  Rotation angle range: 88.05° - 142.06°\n"
+      "  Rotation angle range: 64.84° - 179.54°\n"
      ]
     }
    ],
    "source": [
-    "#transform a strucutre's residues into rigid body transforms\n",
-    "from Bio.PDB import PDBParser\n",
-    "pdb_parser = PDBParser(QUIET=True)\n",
+    "\n",
     "pdb_structure = pdb_parser.get_structure('1eei', pdb_path)\n",
     "pdb_transforms = get_residue_transformations_from_pdb(\n",
     "\tpdb_structure, chain_id=None, device=None\n",
@@ -507,6 +523,149 @@
     "pdb_analysis = analyze_residue_transformations(pdb_transforms, verbose=True)\n"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "f5540be4",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "============================================================\n",
+      "VALIDATION TESTS FOR get_residue_transformations\n",
+      "============================================================\n",
+      "\n",
+      "1. Quaternion Unit Norm Test:\n",
+      "   Min quaternion norm: 1.000000\n",
+      "   Max quaternion norm: 1.000000\n",
+      "   Mean quaternion norm: 1.000000\n",
+      "   ✓ PASS\n",
+      "\n",
+      "2. Rotation Matrix Orthogonality Test:\n",
+      "   Max orthogonality error: 6.597833e-07\n",
+      "   Mean orthogonality error: 2.584600e-07\n",
+      "   ✓ PASS\n",
+      "\n",
+      "3. Rotation Matrix Determinant Test:\n",
+      "   Min determinant: 1.000000\n",
+      "   Max determinant: 1.000000\n",
+      "   Mean determinant: 1.000000\n",
+      "   ✓ PASS\n",
+      "\n",
+      "4. Quaternion-to-Rotation Consistency Test:\n",
+      "   Max consistency error: 2.828426e+00\n",
+      "   Mean consistency error: 2.283508e+00\n",
+      "   ✗ FAIL\n",
+      "\n",
+      "5. Transformation Chain Test:\n",
+      "   Rotation composition error: 2.522347e+00\n",
+      "   Translation composition error: 6.872144e+01\n",
+      "   ✗ FAIL\n",
+      "\n",
+      "============================================================\n",
+      "VALIDATION COMPLETE\n",
+      "============================================================\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Validation tests for get_residue_transformations\n",
+    "\n",
+    "print(\"=\"*60)\n",
+    "print(\"VALIDATION TESTS FOR get_residue_transformations\")\n",
+    "print(\"=\"*60)\n",
+    "\n",
+    "# Test 1: Check quaternion properties\n",
+    "print(\"\\n1. Quaternion Unit Norm Test:\")\n",
+    "quat_norms = torch.norm(pdb_transforms['quats'], dim=1)\n",
+    "print(f\"   Min quaternion norm: {quat_norms.min():.6f}\")\n",
+    "print(f\"   Max quaternion norm: {quat_norms.max():.6f}\")\n",
+    "print(f\"   Mean quaternion norm: {quat_norms.mean():.6f}\")\n",
+    "print(f\"   ✓ PASS\" if torch.allclose(quat_norms, torch.ones_like(quat_norms), atol=1e-5) else \"   ✗ FAIL\")\n",
+    "\n",
+    "# Test 2: Check rotation matrix orthogonality (R^T @ R should be identity)\n",
+    "print(\"\\n2. Rotation Matrix Orthogonality Test:\")\n",
+    "R = pdb_transforms['rotations']\n",
+    "identity_errors = []\n",
+    "for i in range(len(R)):\n",
+    "    should_be_identity = R[i].T @ R[i]\n",
+    "    error = torch.norm(should_be_identity - torch.eye(3), p='fro')\n",
+    "    identity_errors.append(error.item())\n",
+    "\n",
+    "identity_errors = torch.tensor(identity_errors)\n",
+    "print(f\"   Max orthogonality error: {identity_errors.max():.6e}\")\n",
+    "print(f\"   Mean orthogonality error: {identity_errors.mean():.6e}\")\n",
+    "print(f\"   ✓ PASS\" if identity_errors.max() < 1e-5 else \"   ✗ FAIL\")\n",
+    "\n",
+    "# Test 3: Check rotation matrix determinant (should be +1)\n",
+    "print(\"\\n3. Rotation Matrix Determinant Test:\")\n",
+    "determinants = torch.stack([torch.det(R[i]) for i in range(len(R))])\n",
+    "print(f\"   Min determinant: {determinants.min():.6f}\")\n",
+    "print(f\"   Max determinant: {determinants.max():.6f}\")\n",
+    "print(f\"   Mean determinant: {determinants.mean():.6f}\")\n",
+    "print(f\"   ✓ PASS\" if torch.allclose(determinants, torch.ones_like(determinants), atol=1e-5) else \"   ✗ FAIL\")\n",
+    "\n",
+    "# Test 4: Check quaternion-to-rotation consistency\n",
+    "print(\"\\n4. Quaternion-to-Rotation Consistency Test:\")\n",
+    "from foldtree2.src.losses.fape import quaternion_to_rotation_matrix\n",
+    "R_from_quats = quaternion_to_rotation_matrix(pdb_transforms['quats'])\n",
+    "consistency_error = torch.norm(R_from_quats - R, p='fro', dim=[1, 2])\n",
+    "print(f\"   Max consistency error: {consistency_error.max():.6e}\")\n",
+    "print(f\"   Mean consistency error: {consistency_error.mean():.6e}\")\n",
+    "print(f\"   ✓ PASS\" if consistency_error.max() < 1e-4 else \"   ✗ FAIL\")\n",
+    "\n",
+    "# Test 5: Verify transformation composition\n",
+    "print(\"\\n5. Transformation Chain Test:\")\n",
+    "# Apply transforms sequentially and check against direct computation\n",
+    "transforms = pdb_transforms['transforms']\n",
+    "composed_transform = transforms[0]\n",
+    "for i in range(1, min(5, len(transforms))):  # Test first 5 transforms\n",
+    "    composed_transform = composed_transform.compose(transforms[i])\n",
+    "\n",
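+    "# The composed transform is compared against the transform built directly from the frames of residues 0 and 5 (indices hard-coded below); note the loop above is capped at min(5, len(transforms)) while index 5 is not\n",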
+    "residue_list = list(pdb_structure[0][list(pdb_structure[0].child_dict.keys())[0]])\n",
+    "coords_0 = {\n",
+    "    'N': torch.tensor(residue_list[0]['N'].get_coord(), dtype=torch.float32),\n",
+    "    'CA': torch.tensor(residue_list[0]['CA'].get_coord(), dtype=torch.float32),\n",
+    "    'C': torch.tensor(residue_list[0]['C'].get_coord(), dtype=torch.float32)\n",
+    "}\n",
+    "coords_5 = {\n",
+    "    'N': torch.tensor(residue_list[5]['N'].get_coord(), dtype=torch.float32),\n",
+    "    'CA': torch.tensor(residue_list[5]['CA'].get_coord(), dtype=torch.float32),\n",
+    "    'C': torch.tensor(residue_list[5]['C'].get_coord(), dtype=torch.float32)\n",
+    "}\n",
+    "\n",
+    "frame_0 = Rigid.from_3_points(\n",
+    "    p_neg_x_axis=coords_0['N'].unsqueeze(0),\n",
+    "    origin=coords_0['CA'].unsqueeze(0),\n",
+    "    p_xy_plane=coords_0['C'].unsqueeze(0)\n",
+    ")\n",
+    "frame_5 = Rigid.from_3_points(\n",
+    "    p_neg_x_axis=coords_5['N'].unsqueeze(0),\n",
+    "    origin=coords_5['CA'].unsqueeze(0),\n",
+    "    p_xy_plane=coords_5['C'].unsqueeze(0)\n",
+    ")\n",
+    "\n",
+    "direct_transform = frame_5.compose(frame_0.invert())\n",
+    "rotation_error = torch.norm(\n",
+    "    composed_transform.get_rots().get_rot_mats() - direct_transform.get_rots().get_rot_mats(), \n",
+    "    p='fro'\n",
+    ")\n",
+    "translation_error = torch.norm(\n",
+    "    composed_transform.get_trans() - direct_transform.get_trans()\n",
+    ")\n",
+    "\n",
+    "print(f\"   Rotation composition error: {rotation_error.item():.6e}\")\n",
+    "print(f\"   Translation composition error: {translation_error.item():.6e}\")\n",
+    "print(f\"   ✓ PASS\" if rotation_error < 1e-4 and translation_error < 1e-4 else \"   ✗ FAIL\")\n",
+    "\n",
+    "print(\"\\n\" + \"=\"*60)\n",
+    "print(\"VALIDATION COMPLETE\")\n",
+    "print(\"=\"*60)"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": 44,
@@ -553,33 +712,9 @@
     "\tplt.show()\n",
     "\n",
     "\n",
-    "def reconstruct_positions(R, T):\n",
-    "\t\"\"\"\n",
-    "\tReconstruct 3D positions from a sequence of rotation matrices and translation vectors.\n",
-    "\t\n",
-    "\tArgs:\n",
-    "\t\tR (torch.Tensor): Rotation matrices of shape (N, 3, 3)\n",
-    "\t\tT (torch.Tensor): Translation vectors of shape (N, 3)\n",
-    "\t\t\n",
-    "\tReturns:\n",
-    "\t\ttorch.Tensor: Reconstructed positions of shape (N+1, 3), starting from origin\n",
-    "\t\"\"\"\n",
-    "\tpositions = torch.zeros(len(T) + 1, 3, dtype=T.dtype, device=T.device)\n",
-    "\tcurrent_pos = torch.zeros(3, dtype=T.dtype, device=T.device)\n",
-    "\t\n",
-    "\tfor i in range(len(T)):\n",
-    "\t\tcurrent_pos = R[i] @ current_pos + T[i]\n",
-    "\t\tpositions[i + 1] = current_pos\n",
-    "\t\n",
-    "\treturn positions\n",
-    "\n",
     "def plot_reconstructed_chain(R, T, title=\"Reconstructed Chain\"):\n",
-    "\tR = R.detach().cpu()\n",
-    "\tT = T.detach().cpu()\n",
     "\tpositions = reconstruct_positions(R, T)\n",
-    "\t\n",
-    "\tplot_points(positions, title)\n",
-    "\n"
+    "\tplot_points(positions, title=title)"
    ]
   },
   {
@@ -930,8 +1065,6 @@
     }
    ],
    "source": [
-    "from src.losses.losses import compute_chain_positions\n",
-    "\n",
     "# Extract original CA coordinates\n",
     "ca_coords = pdb2pyg.extract_pdb_coordinates(pdb_path, atom_type=\"CA\")\n",
     "\n",
@@ -1018,8 +1151,6 @@
     }
    ],
    "source": [
-    "from src.losses.losses import compute_chain_positions\n",
-    "\n",
     "def plot_quaternion_and_rt_alignment(quats, translations, R, T, title=\"Alignment Plot\"):\n",
     "\t\"\"\"\n",
     "\tPlot points created from quaternion chain and from RT values to check alignment.\n",
@@ -1141,7 +1272,6 @@
     "plot_quaternion_chain(quaternions_noisy, t_noisy, \"Noisy Quaternion Chain Positions\")\n",
     "\n",
     "# --- Compute FAPE loss and lDDT loss ---\n",
-    "from losses.losses import fape_loss, lddt_loss\n",
     "\n",
     "# FAPE loss (using original as true, noisy as pred)\n",
     "batch = torch.zeros(coords.shape[0], dtype=torch.long)  # single batch\n",
@@ -1169,21 +1299,25 @@
     "ax.legend()\n",
     "plt.show()"
    ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0121113b",
-   "metadata": {},
-   "outputs": [],
-   "source": []
   }
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "foldtree2",
    "language": "python",
    "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.23"
   }
  },
  "nbformat": 4,