MobileTeleSystems
diff --git a/docker/Dockerfile.scheduler b/docker/Dockerfile.scheduler
Lines changed: 1 addition & 1 deletion
diff --git a/docker/Dockerfile.server b/docker/Dockerfile.server
Lines changed: 1 addition & 1 deletion
diff --git a/docker/Dockerfile.worker b/docker/Dockerfile.worker
Lines changed: 1 addition & 1 deletion
diff --git a/docs/changelog/next_release/255.improvement.rst b/docs/changelog/next_release/255.improvement.rst
Lines changed: 2 additions & 0 deletions
diff --git a/syncmaster/db/migrations/versions/2025-08-10_0012_update_ts.py b/syncmaster/db/migrations/versions/2025-08-10_0012_update_ts.py
Lines changed: 243 additions & 0 deletions
diff --git a/syncmaster/db/models/connection.py b/syncmaster/db/models/connection.py
Lines changed: 19 additions & 5 deletions
diff --git a/syncmaster/db/models/group.py b/syncmaster/db/models/group.py
Lines changed: 16 additions & 3 deletions
diff --git a/syncmaster/db/models/queue.py b/syncmaster/db/models/queue.py
Lines changed: 16 additions & 2 deletions
@@ -1,5 +1,5 @@
 ARG PYTHON_VERSION=3.13
-FROM python:$PYTHON_VERSION-slim AS base
+FROM python:$PYTHON_VERSION-slim-bookworm AS base
 
 WORKDIR /app
 ENV PYTHONPATH=/app \
 
@@ -1,5 +1,5 @@
 ARG PYTHON_VERSION=3.13
-FROM python:$PYTHON_VERSION-slim AS base
+FROM python:$PYTHON_VERSION-slim-bookworm AS base
 
 RUN apt-get update \
     && apt-get install -y --no-install-recommends \
 
@@ -1,5 +1,5 @@
 ARG PYTHON_VERSION=3.13
-FROM python:$PYTHON_VERSION-slim AS base
+FROM python:$PYTHON_VERSION-slim-bookworm AS base
 
 RUN apt-get update && apt-get install -y --no-install-recommends \
         openjdk-17-jdk-headless \
 
@@ -0,0 +1,2 @@
+Improved full-text search by refining ``tsvector`` generation and adding better tokenization for technical fields such as hostnames, table names, and directory paths.
+-- by :github:user:`marashka`
@@ -0,0 +1,243 @@
+# SPDX-FileCopyrightText: 2023-2024 MTS PJSC
+# SPDX-License-Identifier: Apache-2.0
+"""Update text search
+
+Revision ID: 0012
+Revises: 0011
+Create Date: 2025-08-10 20:03:02.105470
+
+"""
+
+import sqlalchemy as sa
+from alembic import op
+from sqlalchemy.dialects import postgresql
+
+# revision identifiers, used by Alembic.
+revision = "0012"
+down_revision = "0011"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    """Rebuild the ``search_vector`` computed columns with multi-dictionary tokenization.
+
+    The existing ``search_vector`` column is dropped from ``connection``,
+    ``group``, ``transfer`` and ``queue`` (together with the GIN indexes on
+    ``connection`` and ``transfer``) and re-added as a persisted computed
+    ``tsvector`` built by concatenating:
+
+    * ``to_tsvector('russian', ...)`` of ``name``;
+    * ``to_tsvector('simple', ...)`` of the raw value;
+    * ``to_tsvector('simple', ...)`` of the value after ``translate()`` has
+      replaced ``.``, ``/``, ``-``, ``_``, ``:`` and backslash with spaces.
+
+    ``connection`` additionally indexes ``data->>'host'``; ``transfer``
+    additionally indexes ``table_name`` and ``directory_path`` taken from both
+    ``source_params`` and ``target_params``. GIN indexes are recreated for
+    ``connection`` and ``transfer`` only.
+    """
+    # Remove the old columns; the two indexed tables lose their GIN index first.
+    op.drop_index(op.f("idx_connection_search_vector"), table_name="connection", postgresql_using="gin")
+    op.drop_column("connection", "search_vector")
+    op.drop_column("group", "search_vector")
+    op.drop_index(op.f("idx_transfer_search_vector"), table_name="transfer", postgresql_using="gin")
+    op.drop_column("transfer", "search_vector")
+    op.drop_column("queue", "search_vector")
+
+    # NOTE: the SQL below lives in regular (non-raw) Python strings, so every
+    # backslash is written doubled. A single backslash at the end of a line
+    # would be a Python line continuation and silently glue the following
+    # line onto the current one.
+    op.add_column(
+        "connection",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed(
+                """
+                -- === NAME FIELD ===
+                -- Russian stemming for better morphological matching of regular words
+                to_tsvector('russian', coalesce(name, ''))
+                -- Simple dictionary (no stemming) for exact token match
+                || to_tsvector('simple', coalesce(name, ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\
+                -- (used when 'name' contains technical fields)
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(name, ''), './-_:\\', '      ')
+                )
+
+                -- === HOST FIELD (from JSON) ===
+                -- Simple dictionary (no stemming) for exact match
+                || to_tsvector('simple', coalesce(data->>'host', ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\ for partial token matching
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(data->>'host', ''), './-_:\\', '      ')
+                )
+                """,
+                persisted=True,
+            ),
+            nullable=False,
+        ),
+    )
+    op.create_index(
+        "idx_connection_search_vector",
+        "connection",
+        ["search_vector"],
+        unique=False,
+        postgresql_using="gin",
+    )
+
+    # "group" gets the name-only vector and no index.
+    op.add_column(
+        "group",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed(
+                """
+                -- === NAME FIELD ===
+                -- Russian stemming for better morphological matching of regular words
+                to_tsvector('russian', coalesce(name, ''))
+                -- Simple dictionary (no stemming) for exact token match
+                || to_tsvector('simple', coalesce(name, ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\
+                -- (used when 'name' contains technical fields)
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(name, ''), './-_:\\', '      ')
+                )
+                """,
+                persisted=True,
+            ),
+            nullable=False,
+        ),
+    )
+
+    # "queue" gets the same name-only vector and no index.
+    op.add_column(
+        "queue",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed(
+                """
+                -- === NAME FIELD ===
+                -- Russian stemming for better morphological matching of regular words
+                to_tsvector('russian', coalesce(name, ''))
+                -- Simple dictionary (no stemming) for exact token match
+                || to_tsvector('simple', coalesce(name, ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\
+                -- (used when 'name' contains technical fields)
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(name, ''), './-_:\\', '      ')
+                )
+                """,
+                persisted=True,
+            ),
+            nullable=False,
+        ),
+    )
+
+    # "transfer" indexes the name plus table names and directory paths of both endpoints.
+    op.add_column(
+        "transfer",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed(
+                """
+                -- === NAME FIELD ===
+                -- Russian stemming for better morphological matching of regular words
+                to_tsvector('russian', coalesce(name, ''))
+                -- Simple dictionary (no stemming) for exact token match
+                || to_tsvector('simple', coalesce(name, ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\
+                -- (used when 'name' contains technical fields)
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(name, ''), './-_:\\', '      ')
+                )
+
+                -- === TABLE NAME FIELDS ===
+                -- Simple dictionary (no stemming) for exact match
+                || to_tsvector('simple', coalesce(source_params->>'table_name', ''))
+                || to_tsvector('simple', coalesce(target_params->>'table_name', ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\ for partial token matching
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(source_params->>'table_name', ''), './-_:\\', '      ')
+                )
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(target_params->>'table_name', ''), './-_:\\', '      ')
+                )
+
+                -- === DIRECTORY PATH FIELDS ===
+                -- Simple dictionary (no stemming) for exact match
+                || to_tsvector('simple', coalesce(source_params->>'directory_path', ''))
+                || to_tsvector('simple', coalesce(target_params->>'directory_path', ''))
+                -- Simple dictionary with translate(): split by . / - _ : \\ for partial token matching
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(source_params->>'directory_path', ''), './-_:\\', '      ')
+                )
+                || to_tsvector(
+                    'simple',
+                    translate(coalesce(target_params->>'directory_path', ''), './-_:\\', '      ')
+                )
+                """,
+                persisted=True,
+            ),
+            nullable=False,
+        ),
+    )
+    op.create_index("idx_transfer_search_vector", "transfer", ["search_vector"], unique=False, postgresql_using="gin")
+
+
+def downgrade() -> None:
+    """Restore the previous single-dictionary (``english``) ``search_vector`` columns.
+
+    Drops the ``search_vector`` column from ``transfer``, ``group``,
+    ``connection`` and ``queue`` (and the GIN indexes on ``transfer`` and
+    ``connection``), then re-adds each column as a persisted computed
+    ``tsvector`` using the ``to_tsvector('english'::regconfig, ...)``
+    expressions below. GIN indexes are recreated for ``transfer`` and
+    ``connection`` only.
+    """
+    # Remove the columns and indexes created by upgrade().
+    op.drop_index("idx_transfer_search_vector", table_name="transfer", postgresql_using="gin")
+    op.drop_column("transfer", "search_vector")
+    op.drop_column("group", "search_vector")
+    op.drop_index("idx_connection_search_vector", table_name="connection", postgresql_using="gin")
+    op.drop_column("connection", "search_vector")
+    op.drop_column("queue", "search_vector")
+
+    # transfer: name, table names and directory paths of both endpoints, each
+    # also added with '.' and '/' translated to spaces.
+    op.add_column(
+        "transfer",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed(
+                "to_tsvector('english'::regconfig, (((((((((((((((((((name)::text || ' '::text) || COALESCE(json_extract_path_text(source_params, VARIADIC ARRAY['table_name'::text]), ''::text)) || ' '::text) || COALESCE(json_extract_path_text(target_params, VARIADIC ARRAY['table_name'::text]), ''::text)) || ' '::text) || COALESCE(json_extract_path_text(source_params, VARIADIC ARRAY['directory_path'::text]), ''::text)) || ' '::text) || COALESCE(json_extract_path_text(target_params, VARIADIC ARRAY['directory_path'::text]), ''::text)) || ' '::text) || translate((name)::text, './'::text, '  '::text)) || ' '::text) || COALESCE(translate(json_extract_path_text(source_params, VARIADIC ARRAY['table_name'::text]), './'::text, '  '::text), ''::text)) || ' '::text) || COALESCE(translate(json_extract_path_text(target_params, VARIADIC ARRAY['table_name'::text]), './'::text, '  '::text), ''::text)) || ' '::text) || COALESCE(translate(json_extract_path_text(source_params, VARIADIC ARRAY['directory_path'::text]), './'::text, '  '::text), ''::text)) || ' '::text) || COALESCE(translate(json_extract_path_text(target_params, VARIADIC ARRAY['directory_path'::text]), './'::text, '  '::text), ''::text)))",
+                persisted=True,
+            ),
+            autoincrement=False,
+            nullable=False,
+        ),
+    )
+    op.create_index(
+        op.f("idx_transfer_search_vector"),
+        "transfer",
+        ["search_vector"],
+        unique=False,
+        postgresql_using="gin",
+    )
+    # group: name only, no index.
+    op.add_column(
+        "group",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed("to_tsvector('english'::regconfig, (name)::text)", persisted=True),
+            autoincrement=False,
+            nullable=False,
+        ),
+    )
+    # connection: name, host, and host with '.' translated to a space.
+    op.add_column(
+        "connection",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed(
+                "to_tsvector('english'::regconfig, (((((name)::text || ' '::text) || COALESCE(json_extract_path_text(data, VARIADIC ARRAY['host'::text]), ''::text)) || ' '::text) || COALESCE(translate(json_extract_path_text(data, VARIADIC ARRAY['host'::text]), '.'::text, ' '::text), ''::text)))",
+                persisted=True,
+            ),
+            autoincrement=False,
+            nullable=False,
+        ),
+    )
+    op.create_index(
+        op.f("idx_connection_search_vector"),
+        "connection",
+        ["search_vector"],
+        unique=False,
+        postgresql_using="gin",
+    )
+    # queue: name only, no index.
+    op.add_column(
+        "queue",
+        sa.Column(
+            "search_vector",
+            postgresql.TSVECTOR(),
+            sa.Computed("to_tsvector('english'::regconfig, (name)::text)", persisted=True),
+            autoincrement=False,
+            nullable=False,
+        ),
+    )
@@ -41,11 +41,25 @@ class Connection(Base, ResourceMixin, TimestampMixin):
         TSVECTOR,
         Computed(
             """
-            to_tsvector(
-                'english'::regconfig,
-                name || ' ' ||
-                COALESCE(json_extract_path_text(data, 'host'), '') || ' ' ||
-                COALESCE(translate(json_extract_path_text(data, 'host'), '.', ' '), '')
+            -- === NAME FIELD ===
+            -- Russian stemming for better morphological matching of regular words
+            to_tsvector('russian', coalesce(name, ''))
+            -- Simple dictionary (no stemming) for exact token match
+            || to_tsvector('simple', coalesce(name, ''))
+            -- Simple dictionary with translate(): split by . / - _ : \
+            -- (used when 'name' contains technical fields)
+            || to_tsvector(
+                'simple',
+                translate(coalesce(name, ''), './-_:\\', '      ')
+            )
+
+            -- === HOST FIELD (from JSON) ===
+            -- Simple dictionary (no stemming) for exact match
+            || to_tsvector('simple', coalesce(data->>'host', ''))
+            -- Simple dictionary with translate(): split by . / - _ : \\ for partial token matching
+            || to_tsvector(
+                'simple',
+                translate(coalesce(data->>'host', ''), './-_:\\', '      ')
             )
             """,
             persisted=True,
 
@@ -77,13 +77,26 @@ class Group(Base, TimestampMixin):
 
     owner: Mapped[User] = relationship(User)
     queue: Mapped[Queue] = relationship(back_populates="group", cascade="all, delete-orphan")
-
     search_vector: Mapped[str] = mapped_column(
         TSVECTOR,
-        Computed("to_tsvector('english'::regconfig, name)", persisted=True),
+        Computed(
+            """
+            -- === NAME FIELD ===
+            -- Russian stemming for better morphological matching of regular words
+            to_tsvector('russian', coalesce(name, ''))
+            -- Simple dictionary (no stemming) for exact token match
+            || to_tsvector('simple', coalesce(name, ''))
+            -- Simple dictionary with translate(): split by . / - _ : \
+            -- (used when 'name' contains technical fields)
+            || to_tsvector(
+                'simple',
+                translate(coalesce(name, ''), './-_:\\', '      ')
+            )
+            """,
+            persisted=True,
+        ),
         nullable=False,
         deferred=True,
-        doc="Full-text search vector",
     )
 
     def __repr__(self) -> str:
 
@@ -25,10 +25,24 @@ class Queue(Base, ResourceMixin, TimestampMixin):
 
     search_vector: Mapped[str] = mapped_column(
         TSVECTOR,
-        Computed("to_tsvector('english'::regconfig, name)", persisted=True),
+        Computed(
+            """
+            -- === NAME FIELD ===
+            -- Russian stemming for better morphological matching of regular words
+            to_tsvector('russian', coalesce(name, ''))
+            -- Simple dictionary (no stemming) for exact token match
+            || to_tsvector('simple', coalesce(name, ''))
+            -- Simple dictionary with translate(): split by . / - _ : \
+            -- (used when 'name' contains technical fields)
+            || to_tsvector(
+                'simple',
+                translate(coalesce(name, ''), './-_:\\', '      ')
+            )
+            """,
+            persisted=True,
+        ),
         nullable=False,
         deferred=True,
-        doc="Full-text search vector",
     )
 
     def __repr__(self):
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	+Improved full-text search by refining ``tsvector`` generation and adding better tokenization for technical fields such as hostnames, table names, and directory paths.
	`2`	+-- by :github:user:`marashka`