Skip to content

Commit 03c048e

Browse files
committed
run ruff
1 parent 12301b3 commit 03c048e

File tree

2 files changed

+18
-7
lines changed

2 files changed

+18
-7
lines changed

src/data_designer/config/config_builder.py

Lines changed: 14 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,8 @@
66
import json
77
import logging
88
from pathlib import Path
9-
from typing import Union, Optional
9+
from typing import Optional, Union
10+
1011
from pygments import highlight
1112
from pygments.formatters import HtmlFormatter
1213
from pygments.lexers import PythonLexer
@@ -27,12 +28,12 @@
2728
)
2829
from .seed import (
2930
DatastoreSeedDatasetReference,
31+
IndexRange,
3032
LocalSeedDatasetReference,
33+
PartitionBlock,
3134
SamplingStrategy,
3235
SeedConfig,
3336
SeedDatasetReference,
34-
IndexRange,
35-
PartitionBlock,
3637
)
3738
from .utils.constants import DEFAULT_REPR_HTML_STYLE, REPR_HTML_TEMPLATE
3839
from .utils.info import DataDesignerInfo
@@ -115,7 +116,11 @@ def from_config(cls, config: dict | str | Path | BuilderConfig) -> Self:
115116
datastore_settings=builder_config.datastore_settings,
116117
)
117118
builder.set_seed_datastore_settings(builder_config.datastore_settings)
118-
builder.with_seed_dataset(seed_dataset_reference, sampling_strategy=config.seed_config.sampling_strategy, selection_strategy=config.seed_config.selection_strategy)
119+
builder.with_seed_dataset(
120+
seed_dataset_reference,
121+
sampling_strategy=config.seed_config.sampling_strategy,
122+
selection_strategy=config.seed_config.selection_strategy,
123+
)
119124

120125
return builder
121126

@@ -511,7 +516,11 @@ def with_seed_dataset(
511516
Returns:
512517
The current Data Designer config builder instance.
513518
"""
514-
self._seed_config = SeedConfig(dataset=dataset_reference.dataset, sampling_strategy=sampling_strategy, selection_strategy=selection_strategy)
519+
self._seed_config = SeedConfig(
520+
dataset=dataset_reference.dataset,
521+
sampling_strategy=sampling_strategy,
522+
selection_strategy=selection_strategy,
523+
)
515524
self.set_seed_datastore_settings(
516525
dataset_reference.datastore_settings if hasattr(dataset_reference, "datastore_settings") else None
517526
)

src/data_designer/engine/column_generators/generators/seed_dataset.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -60,7 +60,7 @@ def _initialize(self) -> None:
6060
self._dataset_uri = self.resource_provider.datastore.get_dataset_uri(self.config.dataset)
6161
self._seed_dataset_size = self.duckdb_conn.execute(f"SELECT COUNT(*) FROM '{self._dataset_uri}'").fetchone()[0]
6262
self._index_range = self._resolve_index_range()
63-
63+
6464
def _validate_selection_strategy(self) -> None:
6565
err_msg = None
6666
if self.config.selection_strategy is not None:
@@ -115,7 +115,9 @@ def _sample_records(self, num_records: int) -> pd.DataFrame:
115115
logger.info(f" |-- seed dataset size: {self._seed_dataset_size} records")
116116
logger.info(f" |-- sampling strategy: {self.config.sampling_strategy}")
117117
if self._index_range is not None:
118-
logger.info(f" |-- selection strategy: {type(self.config.selection_strategy).__name__}\n{self.config.selection_strategy.model_dump_json(indent=4)}")
118+
logger.info(
119+
f" |-- selection strategy: {type(self.config.selection_strategy).__name__}\n{self.config.selection_strategy.model_dump_json(indent=4)}"
120+
)
119121
logger.info(f" |-- seed dataset size after selection: {self._index_range.size} records")
120122
df_batch = pd.DataFrame()
121123
df_sample = pd.DataFrame() if self._df_remaining is None else self._df_remaining

0 commit comments

Comments
 (0)