
Commit 6085d15

work
1 parent a0d9481 commit 6085d15

File tree

14 files changed: +633 -30 lines changed
Lines changed: 110 additions & 0 deletions

@@ -0,0 +1,110 @@

"""add comp_run_snapshot_tasks table

Revision ID: dfa87810f245
Revises: 278daef7e99d
Create Date: 2025-05-26 14:17:04.227338+00:00

"""

import sqlalchemy as sa
from alembic import op
from sqlalchemy.dialects import postgresql

# revision identifiers, used by Alembic.
revision = "dfa87810f245"
down_revision = "278daef7e99d"
branch_labels = None
depends_on = None


def upgrade():
    # ### commands auto generated by Alembic - please adjust! ###
    op.create_table(
        "comp_run_snapshot_tasks",
        sa.Column("snapshot_task_id", sa.Integer(), nullable=False),
        sa.Column("run_id", sa.Integer(), nullable=False),
        sa.Column("project_id", sa.String(), nullable=True),
        sa.Column("node_id", sa.String(), nullable=True),
        sa.Column(
            "node_class",
            postgresql.ENUM(
                "COMPUTATIONAL",
                "INTERACTIVE",
                "FRONTEND",
                name="nodeclass",
                create_type=False,
            ),
            nullable=True,
        ),
        sa.Column("job_id", sa.String(), nullable=True),
        sa.Column("internal_id", sa.Integer(), nullable=True),
        sa.Column("schema", sa.JSON(), nullable=True),
        sa.Column("inputs", sa.JSON(), nullable=True),
        sa.Column("outputs", sa.JSON(), nullable=True),
        sa.Column("run_hash", sa.String(), nullable=True),
        sa.Column("image", sa.JSON(), nullable=True),
        sa.Column(
            "state",
            postgresql.ENUM(
                "NOT_STARTED",
                "PUBLISHED",
                "PENDING",
                "RUNNING",
                "SUCCESS",
                "FAILED",
                "ABORTED",
                name="statetype",
                create_type=False,
            ),
            server_default="NOT_STARTED",
            nullable=False,
        ),
        sa.Column("errors", postgresql.JSONB(astext_type=sa.Text()), nullable=True),
        sa.Column("progress", sa.Numeric(precision=3, scale=2), nullable=True),
        sa.Column("start", sa.DateTime(timezone=True), nullable=True),
        sa.Column("end", sa.DateTime(timezone=True), nullable=True),
        sa.Column("last_heartbeat", sa.DateTime(timezone=True), nullable=True),
        sa.Column(
            "created",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=False,
        ),
        sa.Column(
            "modified",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=False,
        ),
        sa.Column(
            "pricing_info", postgresql.JSONB(astext_type=sa.Text()), nullable=True
        ),
        sa.Column(
            "hardware_info", postgresql.JSONB(astext_type=sa.Text()), nullable=True
        ),
        sa.Column(
            "submit",
            sa.DateTime(timezone=True),
            server_default=sa.text("'1900-01-01T00:00:00Z'::timestamptz"),
            nullable=True,
        ),
        sa.ForeignKeyConstraint(
            ["project_id"],
            ["comp_pipeline.project_id"],
        ),
        sa.ForeignKeyConstraint(
            ["run_id"],
            ["comp_runs.run_id"],
            name="fk_snapshot_tasks_to_comp_runs",
            onupdate="CASCADE",
            ondelete="CASCADE",
        ),
        sa.PrimaryKeyConstraint("snapshot_task_id"),
    )
    # ### end Alembic commands ###


def downgrade():
    # ### commands auto generated by Alembic - please adjust! ###
    op.drop_table("comp_run_snapshot_tasks")
    # ### end Alembic commands ###
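
For reference, a migration like this is applied or rolled back with the alembic CLI or its Python command API. Below is a minimal sketch using the command API; the config file location and database URL are illustrative assumptions, not part of this commit.

# Sketch: apply/roll back this revision programmatically (path and URL are hypothetical).
from alembic import command
from alembic.config import Config

alembic_cfg = Config("alembic.ini")  # assumed location of the migration config
alembic_cfg.set_main_option(
    "sqlalchemy.url", "postgresql://user:pass@localhost/simcoredb"  # placeholder DSN
)

command.upgrade(alembic_cfg, "dfa87810f245")    # creates comp_run_snapshot_tasks
command.downgrade(alembic_cfg, "278daef7e99d")  # drops it again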
Lines changed: 130 additions & 0 deletions

@@ -0,0 +1,130 @@

"""Computational Tasks Table"""

import sqlalchemy as sa
from sqlalchemy.dialects import postgresql
from sqlalchemy.dialects.postgresql import ENUM

from ._common import (
    RefActions,
    column_created_datetime,
    column_modified_datetime,
)
from .base import metadata
from .comp_pipeline import StateType
from .comp_runs import comp_runs

comp_run_snapshot_tasks = sa.Table(
    "comp_run_snapshot_tasks",
    metadata,
    sa.Column(
        "snapshot_task_id",
        sa.Integer,
        primary_key=True,
    ),
    sa.Column(
        "run_id",
        sa.Integer,
        sa.ForeignKey(
            comp_runs.c.run_id,
            name="fk_snapshot_tasks_to_comp_runs",
            onupdate=RefActions.CASCADE,
            ondelete=RefActions.CASCADE,
        ),
        nullable=False,
    ),
    sa.Column(
        "project_id",
        sa.String,
        sa.ForeignKey("comp_pipeline.project_id"),
        doc="Project that contains the node associated to this task",
    ),
    sa.Column("node_id", sa.String, doc="Node associated to this task"),
    sa.Column(
        "node_class",
        ENUM(
            "COMPUTATIONAL",
            "INTERACTIVE",
            "FRONTEND",
            name="nodeclass",
            create_type=False,  # necessary to avoid alembic "nodeclass already exists" error
        ),
        doc="Classification of the node associated to this task",
    ),
    sa.Column("job_id", sa.String, doc="Worker job ID for this task"),
    sa.Column("internal_id", sa.Integer, doc="DEV: only for development. From 1 to N"),
    sa.Column("schema", sa.JSON, doc="Schema for inputs and outputs"),
    sa.Column("inputs", sa.JSON, doc="Input values"),
    sa.Column("outputs", sa.JSON, doc="Output values"),
    sa.Column(
        "run_hash",
        sa.String,
        nullable=True,
        doc="Hashes inputs before run. Used to detect changes in inputs.",
    ),
    sa.Column(
        "image", sa.JSON, doc="Metadata about service image associated to this node"
    ),
    sa.Column(
        "state",
        ENUM(
            "NOT_STARTED",
            "PUBLISHED",
            "PENDING",
            "RUNNING",
            "SUCCESS",
            "FAILED",
            "ABORTED",
            name="statetype",
            create_type=False,  # necessary to avoid alembic "statetype already exists" error
        ),
        nullable=False,
        server_default=StateType.NOT_STARTED.value,
        doc="Current state in the task lifecycle",
    ),
    sa.Column(
        "errors",
        postgresql.JSONB,
        nullable=True,
        doc="List[models_library.errors.ErrorDict] with error information"
        " for a failing state, otherwise set to None",
    ),
    sa.Column(
        "progress",
        sa.Numeric(precision=3, scale=2),  # numbers from 0.00 to 1.00
        nullable=True,
        doc="Current progress of the task, if available",
    ),
    sa.Column(
        "start", sa.DateTime(timezone=True), doc="UTC timestamp when task started"
    ),
    sa.Column(
        "end", sa.DateTime(timezone=True), doc="UTC timestamp for task completion"
    ),
    sa.Column(
        "last_heartbeat",
        sa.DateTime(timezone=True),
        doc="UTC timestamp of the last task-running check",
    ),
    column_created_datetime(timezone=True),
    column_modified_datetime(timezone=True),
    sa.Column(
        "pricing_info",
        postgresql.JSONB,
        nullable=True,
        doc="Billing information of this task",
    ),
    sa.Column(
        "hardware_info",
        postgresql.JSONB,
        nullable=True,
        doc="Hardware information of this task",
    ),
    # deprecated columns must be kept due to legacy services
    # utc timestamps for submission/start/end
    sa.Column(
        "submit",
        sa.DateTime(timezone=True),
        server_default=sa.text("'1900-01-01T00:00:00Z'::timestamptz"),
        doc="[DEPRECATED] Unused but kept for legacy services; must be filled with a default value of 1 January 1900",
    ),
)
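
The table above mirrors comp_tasks but keys rows by snapshot_task_id and ties each row to a run via run_id. A quick way to see how a row behaves (server defaults, shared enums) is a plain SQLAlchemy Core round trip. A minimal sketch, assuming the schema is already migrated, that the model lives at the module path below (inferred from the sibling imports in this commit), and a placeholder connection URL:

# Sketch: insert one snapshot-task row and read it back (URL and values are illustrative).
import sqlalchemy as sa

from simcore_postgres_database.models.comp_run_snapshot_tasks import (
    comp_run_snapshot_tasks,  # assumed module path
)

engine = sa.create_engine("postgresql://user:pass@localhost/simcoredb")  # placeholder
with engine.begin() as conn:
    # NOTE: run_id is a FK to comp_runs.run_id, so a matching comp_runs row must exist.
    result = conn.execute(
        sa.insert(comp_run_snapshot_tasks)
        .values(run_id=1, node_id="some-node-uuid")
        .returning(comp_run_snapshot_tasks.c.snapshot_task_id)
    )
    snapshot_task_id = result.scalar_one()
    row = conn.execute(
        sa.select(comp_run_snapshot_tasks).where(
            comp_run_snapshot_tasks.c.snapshot_task_id == snapshot_task_id
        )
    ).one()
    print(row.state)  # "NOT_STARTED", filled in by the server_default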

packages/simcore-sdk/src/simcore_sdk/node_ports_common/dbmanager.py

Lines changed: 32 additions & 3 deletions
@@ -2,14 +2,20 @@
 
 import sqlalchemy as sa
 from common_library.json_serialization import json_dumps, json_loads
-
 from models_library.projects import ProjectID
+from models_library.projects_nodes_io import NodeID
 from models_library.users import UserID
 from pydantic import TypeAdapter
 from servicelib.db_asyncpg_utils import create_async_engine_and_database_ready
 from settings_library.node_ports import NodePortsSettings
 from simcore_postgres_database.models.comp_tasks import comp_tasks
 from simcore_postgres_database.models.projects import projects
+from simcore_service_director_v2.modules.db.repositories.comp_runs import (
+    CompRunsRepository,
+)
+from simcore_service_director_v2.modules.db.repositories.comp_runs_snapshot_tasks import (
+    CompRunsSnapshotTasksRepository,
+)
 from sqlalchemy.ext.asyncio import AsyncConnection, AsyncEngine
 
 from .exceptions import NodeNotFound, ProjectNotFoundError

@@ -78,7 +84,10 @@ def __init__(self, db_engine: AsyncEngine | None = None):
         self._db_engine = db_engine
 
     async def write_ports_configuration(
-        self, json_configuration: str, project_id: str, node_uuid: str
+        self,
+        json_configuration: str,
+        project_id: str,
+        node_uuid: str,
     ):
         message = (
             f"Writing port configuration to database for "

@@ -91,7 +100,7 @@ async def write_ports_configuration(
             DBContextManager(self._db_engine) as engine,
             engine.begin() as connection,
         ):
-            # update the necessary parts
+            # 1. Update comp_tasks table
             await connection.execute(
                 comp_tasks.update()
                 .where(

@@ -105,6 +114,26 @@ async def write_ports_configuration(
                     run_hash=node_configuration.get("run_hash"),
                 )
             )
+            # 2. Get latest run id for the project
+            _latest_run_id = await CompRunsRepository.instance(
+                engine
+            ).get_latest_run_id_for_project(
+                connection, project_id=ProjectID(project_id)
+            )
+            # 3. Update comp_run_snapshot_tasks table
+            await CompRunsSnapshotTasksRepository.instance(
+                engine
+            ).update_for_run_id_and_node_id(
+                connection,
+                run_id=_latest_run_id,
+                node_id=NodeID(node_uuid),
+                data={
+                    "schema": node_configuration["schema"],
+                    "inputs": node_configuration["inputs"],
+                    "outputs": node_configuration["outputs"],
+                    "run_hash": node_configuration.get("run_hash"),
+                },
+            )
 
     async def get_ports_configuration_from_node_uuid(
         self, project_id: str, node_uuid: str
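
The two repository calls added here (`get_latest_run_id_for_project` and `update_for_run_id_and_node_id`) are defined elsewhere in this commit and are not shown in this excerpt. Conceptually, the second one reduces to a single UPDATE scoped to one (run_id, node_id) pair; the sketch below shows only that shape, and its signature and body are assumptions rather than the actual implementation:

# Hypothetical sketch of update_for_run_id_and_node_id; not the code from this commit.
from typing import Any

import sqlalchemy as sa
from models_library.projects_nodes_io import NodeID
from simcore_postgres_database.models.comp_run_snapshot_tasks import (
    comp_run_snapshot_tasks,  # assumed module path
)
from sqlalchemy.ext.asyncio import AsyncConnection


async def update_for_run_id_and_node_id(
    connection: AsyncConnection,
    *,
    run_id: int,
    node_id: NodeID,
    data: dict[str, Any],
) -> None:
    # Touch only the snapshot row belonging to this run AND this node.
    await connection.execute(
        sa.update(comp_run_snapshot_tasks)
        .where(
            (comp_run_snapshot_tasks.c.run_id == run_id)
            & (comp_run_snapshot_tasks.c.node_id == f"{node_id}")
        )
        .values(**data)
    )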

services/director-v2/src/simcore_service_director_v2/api/routes/computations.py

Lines changed: 10 additions & 6 deletions
@@ -199,6 +199,7 @@ async def _try_start_pipeline(
     project: ProjectAtDB,
     users_repo: UsersRepository,
     projects_metadata_repo: ProjectsMetadataRepository,
+    filtered_comp_tasks_in_db: list[CompTaskAtDB],
 ) -> None:
     if not minimal_dag.nodes():
         # 2 options here: either we have cycles in the graph or it's really done

@@ -241,6 +242,7 @@
         )
         or {},
         use_on_demand_clusters=computation.use_on_demand_clusters,
+        filtered_comp_tasks_in_db=filtered_comp_tasks_in_db,
     )
 
 

@@ -340,6 +342,13 @@ async def create_computation(  # noqa: PLR0913 # pylint: disable=too-many-positional-arguments
         rabbitmq_rpc_client=rpc_client,
     )
 
+    # filter the tasks by the effective pipeline
+    filtered_tasks = [
+        t
+        for t in comp_tasks
+        if f"{t.node_id}" in set(minimal_computational_dag.nodes())
+    ]
+
     if computation.start_pipeline:
         await _try_start_pipeline(
             request.app,

@@ -350,14 +359,9 @@ async def create_computation(  # noqa: PLR0913 # pylint: disable=too-many-positional-arguments
             project=project,
             users_repo=users_repo,
             projects_metadata_repo=projects_metadata_repo,
+            filtered_comp_tasks_in_db=filtered_tasks,
         )
 
-    # filter the tasks by the effective pipeline
-    filtered_tasks = [
-        t
-        for t in comp_tasks
-        if f"{t.node_id}" in set(minimal_computational_dag.nodes())
-    ]
     pipeline_state = utils.get_pipeline_state_from_task_states(filtered_tasks)
 
     # get run details if any
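
Moving the filter above `_try_start_pipeline` lets the same `filtered_tasks` list serve both the pipeline start and the later `pipeline_state` computation. The filter itself hinges on stringifying each task's node id, since the DAG stores node names as strings while tasks carry `NodeID` (UUID) objects. A toy illustration of that idiom (names and values are made up):

# Toy example of the f"{t.node_id}" membership test used in the filter above.
from dataclasses import dataclass
from uuid import UUID


@dataclass
class Task:
    node_id: UUID  # tasks carry UUIDs...


dag_nodes = {"6ba7b810-9dad-11d1-80b4-00c04fd430c8"}  # ...the DAG stores strings

tasks = [
    Task(UUID("6ba7b810-9dad-11d1-80b4-00c04fd430c8")),  # in the DAG
    Task(UUID(int=42)),  # not in the DAG
]

# Stringifying the UUID makes it comparable to the DAG's node names.
filtered = [t for t in tasks if f"{t.node_id}" in dag_nodes]
assert len(filtered) == 1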

0 commit comments

Comments
 (0)