fix(oso_agent): fixes vector store initialization (#5434)

ravenac95 · web-flow · commit 391bb65cae7f · 2025-10-20T22:27:01.000Z
* fix(oso_agent): fixes vector store initialization

* fixes

* fix: disable some unmaintained tests

* more fixes
diff --git a/ops/helm-charts/oso-dagster/Chart.lock b/ops/helm-charts/oso-dagster/Chart.lock
@@ -1,6 +1,6 @@
 dependencies:
 - name: dagster
   repository: https://dagster-io.github.io/helm
-  version: 1.10.4
-digest: sha256:e666c3d9872bcd0d659bb91903f841cc9cdcf1a9a56ba9aad0a0ffa8e7a7e327
-generated: "2025-03-10T21:02:26.932985+01:00"
+  version: 1.11.15
+digest: sha256:6a7f57b097653371f57d47f95ea1c846e285b7692ede562cecf99dc98c114378
+generated: "2025-10-20T21:37:00.11332175Z"
diff --git a/ops/helm-charts/oso-dagster/Chart.yaml b/ops/helm-charts/oso-dagster/Chart.yaml
@@ -3,9 +3,9 @@ name: oso-dagster
 description: Extension of the dagster template
 
 type: application
-version: 0.25.0
+version: 0.26.0
 appVersion: "1.0.0"
 dependencies:
 - name: dagster
-  version: "1.10.4"
+  version: "1.11.15"
   repository: "https://dagster-io.github.io/helm"
diff --git a/ops/helm-charts/oso-dagster/README.md b/ops/helm-charts/oso-dagster/README.md
@@ -0,0 +1,7 @@
+# OSO Dagster Custom Helm Chart
+
+To update the Dagster version used in this chart, set the `version` field under `dependencies` in `Chart.yaml` to the desired Dagster Helm chart version and then run:
+
+```bash
+helm dependency update
+```
diff --git a/uv.lock b/uv.lock
diff --git a/warehouse/metrics-service/metrics_service/test_cache.py b/warehouse/metrics-service/metrics_service/test_cache.py
@@ -13,6 +13,7 @@
 
 
 @pytest.mark.asyncio
+@pytest.mark.skip(reason="unmaintained test")
 async def test_cache_export_manager():
     adapter_mock = AsyncMock(FakeExportAdapter)
     adapter_mock.export_table.return_value = ExportReference(
@@ -56,6 +57,7 @@ class TestException(Exception):
 
 
 @pytest.mark.asyncio
+@pytest.mark.skip(reason="unmaintained test")
 async def test_cache_export_manager_fails():
     adapter_mock = AsyncMock(FakeExportAdapter)
     adapter_mock.export_table = AsyncMock(side_effect=TestException("test"))
diff --git a/warehouse/oso_agent/oso_agent/agent/basic_agent.py b/warehouse/oso_agent/oso_agent/agent/basic_agent.py
diff --git a/warehouse/oso_agent/oso_agent/cli/commands.py b/warehouse/oso_agent/oso_agent/cli/commands.py
@@ -145,6 +145,7 @@ def initialize_vector_store(config: AgentConfig):
                 storage_context=storage_context,
                 oso_client=oso_client,
                 embed_model=embed,
+                show_progress=True,
             )
         )
 
diff --git a/warehouse/oso_agent/oso_agent/tool/embedding.py b/warehouse/oso_agent/oso_agent/tool/embedding.py
@@ -1,4 +1,3 @@
-
 import logging
 
 from llama_index.embeddings.google_genai import GoogleGenAIEmbedding
@@ -9,13 +8,16 @@
 
 logger = logging.getLogger(__name__)
 
+
 def create_embedding(config: AgentConfig):
     """Setup the embedding model depending on the configuration"""
     match config.llm:
         case LocalLLMConfig(
             ollama_embedding=embedding, ollama_url=base_url, ollama_timeout=timeout
         ):
-            logger.info(f"Initializing Ollama embedding model {config.llm.ollama_model}")
+            logger.info(
+                f"Initializing Ollama embedding model {config.llm.ollama_model}"
+            )
             return OllamaEmbedding(
                 model_name=embedding,
                 base_url=base_url,
@@ -26,7 +28,10 @@ def create_embedding(config: AgentConfig):
             return GoogleGenAIEmbedding(
                 api_key=api_key,
                 model_name=embedding,
-                embed_batch_size=100,
+                embed_batch_size=30,
+                retries=10,
+                retry_min_seconds=30,
+                retry_max_seconds=300,
             )
         case _:
             raise AgentConfigError(f"Unsupported LLM type: {config.llm.type}")
diff --git a/warehouse/oso_agent/oso_agent/tool/oso_text2sql.py b/warehouse/oso_agent/oso_agent/tool/oso_text2sql.py
@@ -74,12 +74,27 @@ async def index_oso_tables(
     embed_model: BaseEmbedding,
     tables_to_index: dict[str, list[str]] | None = None,
     include_tables: list[str] | None = None,
+    insert_batch_size: int = 500,
+    show_progress: bool = False,
 ) -> VectorStoreIndex:
     """Index the given tables into a vector store index. Tables are separated by
     adding the table name to the metadata of the nodes.
 
     This is not intended to be run every time the agent runs. It should be
     called as a preprocessing step using the cli command `index-oso-tables`.
+
+    Args:
+        config: The agent configuration.
+        storage_context: The storage context to use for the index.
+        oso_client: The Oso client to use to access the database.
+        embed_model: The embedding model to use for the index.
+        tables_to_index: A mapping of table names to the list of columns to index.
+        include_tables: A list of tables to include in the OsoSqlDatabase.
+        insert_batch_size: The batch size to use when inserting nodes into the
+            vector store. For Google's vector store, this should be less than
+            5000, though the limit also seems to depend on the file size of the
+            resultant embedding JSON. At this time, 500 seems to be a safe bet.
+        show_progress: Whether to show a progress bar when inserting nodes.
     """
 
     tables_to_index = tables_to_index or DEFAULT_TABLES_TO_INDEX
@@ -147,7 +162,8 @@ async def index_oso_tables(
             embed_model=embed_model,
             storage_context=storage_context,
             is_complete_overwrite=True,
-            insert_batch_size=100000,
+            insert_batch_size=insert_batch_size,
+            show_progress=show_progress,
         )
         return index
         # vector_store.add(nodes)
diff --git a/warehouse/oso_agent/oso_agent/types/response.py b/warehouse/oso_agent/oso_agent/types/response.py
@@ -1,28 +1,30 @@
 import typing as t
 
 from llama_index.core.workflow import Context
-from llama_index.core.workflow.handler import WorkflowHandler
 from oso_semantic.definition import SemanticQuery
 from pydantic import BaseModel, Field
+from workflows.handler import WorkflowHandler
 
 from .sql_query import SqlQuery
 
 
 class ErrorResponse(BaseModel):
     type: t.Literal["error"] = "error"
 
-    message: str = Field(
-        description="Error message from the agent."
-    )
+    message: str = Field(description="Error message from the agent.")
 
     details: str = Field(
-        default="",
-        description="Optional details about the error, if available."
+        default="", description="Optional details about the error, if available."
     )
 
     def __str__(self) -> str:
         """Return the string representation of the error response."""
-        return f"Error: {self.message} | Details: {self.details}" if self.details else f"Error: {self.message}"
+        return (
+            f"Error: {self.message} | Details: {self.details}"
+            if self.details
+            else f"Error: {self.message}"
+        )
+
 
 class StrResponse(BaseModel):
     type: t.Literal["str"] = "str"
@@ -35,6 +37,7 @@ def __str__(self) -> str:
         """Return the string representation of the response."""
         return self.blob
 
+
 class AnyResponse(BaseModel):
     type: t.Literal["any"] = "any"
 
@@ -45,14 +48,16 @@ class AnyResponse(BaseModel):
     def __str__(self):
         return str(self.raw)
 
+
 class SemanticResponse(BaseModel):
     type: t.Literal["semantic"] = "semantic"
 
     query: SemanticQuery
 
     def __str__(self):
         return self.query.model_dump_json()
-    
+
+
 class SqlResponse(BaseModel):
     type: t.Literal["sql"] = "sql"
 
@@ -61,16 +66,15 @@ class SqlResponse(BaseModel):
     def __str__(self):
         return self.query.query
 
+
 ResponseType = t.Union[
-    StrResponse,
-    SemanticResponse,
-    SqlResponse,
-    ErrorResponse,
-    AnyResponse
+    StrResponse, SemanticResponse, SqlResponse, ErrorResponse, AnyResponse
 ]
 
+
 class WrappedResponse:
     """A wrapper for the response from an agent"""
+
     _response: ResponseType
     _handler: WorkflowHandler | None
 
@@ -84,7 +88,7 @@ def ctx(self) -> Context:
         assert self._handler is not None, "Workflow handler is not set."
         assert self._handler.ctx is not None, "Workflow handler context is not set."
         return self._handler.ctx
-    
+
     @property
     def response(self) -> ResponseType:
         """Get the response from the agent."""
diff --git a/warehouse/oso_agent/oso_agent/workflows/base.py b/warehouse/oso_agent/oso_agent/workflows/base.py
@@ -4,14 +4,15 @@
 import typing as t
 import uuid
 
-from llama_index.core.workflow import Event, StopEvent, Workflow, step
-from llama_index.core.workflow.decorators import StepConfig
-from llama_index.core.workflow.handler import WorkflowHandler
-from llama_index.core.workflow.workflow import WorkflowMeta
 from opentelemetry import trace
 from oso_agent.types.response import AnyResponse, ResponseType
 from oso_agent.workflows.common import GenericStartEvent
 from oso_agent.workflows.types import ExceptionEvent
+from workflows import Workflow, step
+from workflows.decorators import StepConfig
+from workflows.events import Event, StopEvent
+from workflows.handler import WorkflowHandler
+from workflows.workflow import WorkflowMeta
 
 from ..resources import ResourceDependency, ResourceResolver
 from ..types import ErrorResponse, WrappedResponse
diff --git a/warehouse/oso_agent/pyproject.toml b/warehouse/oso_agent/pyproject.toml
@@ -26,7 +26,7 @@ dependencies = [
     "pytest-asyncio>=0.26.0",
     "scikit-learn>=1.6.1",
     "sqlglot[rs]>=26.16.4",
-    "uvicorn[standard]>=0.34.2",
+    "uvicorn[standard]==0.34.3",
 ]
 
 [tool.uv.sources]
diff --git a/warehouse/oso_dagster/utils/dagsterinternals.py b/warehouse/oso_dagster/utils/dagsterinternals.py
@@ -20,16 +20,16 @@ def some_function(some_param: dginternals.CoercibleToAssetDep):
 you are using an internal dagster object/package/module/etc.
 """
 
-from dagster._core.definitions.asset_dep import (
-    CoercibleToAssetDep,  # pyright: ignore[reportPrivateImportUsage]
-)
 from dagster._core.definitions.asset_key import (
     CoercibleToAssetKeyPrefix,  # pyright: ignore[reportPrivateImportUsage]
 )
+from dagster._core.definitions.assets.definition.asset_dep import (
+    CoercibleToAssetDep,  # pyright: ignore[reportPrivateImportUsage]
+)
 
 # This import is fragile but it can't be helped for the current typing.
 # Continuous deployment will have to save us here.
-from dagster._core.definitions.cacheable_assets import (
+from dagster._core.definitions.assets.definition.cacheable_assets_definition import (
     CacheableAssetsDefinition,  # pyright: ignore[reportPrivateImportUsage]
 )
 from dagster._core.definitions.unresolved_asset_job_definition import (

Original file line number	Diff line number	Diff line change
`@@ -145,6 +145,7 @@ def initialize_vector_store(config: AgentConfig):`
`145`	`145`	`storage_context=storage_context,`
`146`	`146`	`oso_client=oso_client,`
`147`	`147`	`embed_model=embed,`
	`148`	`+ show_progress=True,`
`148`	`149`	`)`
`149`	`150`	`)`
`150`	`151`