Skip to content

Commit c1e02ee

Browse files
committed
Cleanup and pre-commit
1 parent 1274a01 commit c1e02ee

File tree

2 files changed

+20
-13
lines changed

2 files changed

+20
-13
lines changed

src/mdio/converters/segy.py

Lines changed: 19 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -18,10 +18,19 @@
1818
from mdio.converters.exceptions import GridTraceSparsityError
1919
from mdio.converters.type_converter import to_structured_type
2020
from mdio.core.grid import Grid
21+
from mdio.core.utils_write import MAX_COORDINATES_BYTES
22+
from mdio.core.utils_write import MAX_SIZE_LIVE_MASK
23+
from mdio.core.utils_write import get_constrained_chunksize
24+
from mdio.schemas.chunk_grid import RegularChunkGrid
25+
from mdio.schemas.chunk_grid import RegularChunkShape
26+
from mdio.schemas.metadata import ChunkGridMetadata
27+
28+
# from mdio.schemas.v1.dataset_builder import ChunkGridMetadata
2129
from mdio.schemas.v1.dataset_serializer import to_xarray_dataset
2230
from mdio.schemas.v1.units import AllUnits
2331
from mdio.schemas.v1.units import LengthUnitEnum
2432
from mdio.schemas.v1.units import LengthUnitModel
33+
from mdio.schemas.v1.variable import VariableMetadata
2534
from mdio.segy import blocked_io
2635
from mdio.segy.utilities import get_grid_plan
2736

@@ -313,30 +322,27 @@ def _add_text_binary_headers(dataset: Dataset, segy_file: SegyFile) -> None:
313322

314323

315324
def _chunk_variable(ds: Dataset, variable_name: str) -> None:
316-
from mdio.core.utils_write import MAX_SIZE_LIVE_MASK
317-
from mdio.core.utils_write import get_constrained_chunksize
318-
from mdio.schemas.chunk_grid import RegularChunkGrid
319-
from mdio.schemas.chunk_grid import RegularChunkShape
320-
from mdio.schemas.metadata import ChunkGridMetadata
321-
from mdio.schemas.v1.dataset_builder import ChunkGridMetadata
322-
from mdio.schemas.v1.variable import VariableMetadata
323-
325+
"""Determines the chunking for a Variable in the dataset."""
324326
# Find the variable by name
325327
idx = -1
326328
for i in range(len(ds.variables)):
327329
if ds.variables[i].name == variable_name:
328330
idx = i
329331
break
330332
if idx == -1:
331-
raise ValueError(f"Variable '{variable_name}' not found in dataset.")
333+
# raise ValueError(f"Variable '{variable_name}' not found in dataset.")
334+
err = f"Variable '{variable_name}' not found in dataset."
335+
raise ValueError(err)
336+
337+
def determine_target_size(t: str) -> int:
338+
if t == "bool":
339+
return MAX_SIZE_LIVE_MASK
340+
return MAX_COORDINATES_BYTES
332341

333342
# Create the chunk grid metadata
334343
t = ds.variables[idx].data_type
335344
full_shape = tuple(dim.size for dim in ds.variables[idx].dimensions)
336-
if t == "bool":
337-
target_size = MAX_SIZE_LIVE_MASK
338-
else:
339-
target_size = 128 * 1024**2
345+
target_size = determine_target_size(t)
340346

341347
chunks = ChunkGridMetadata(
342348
chunk_grid=RegularChunkGrid(

src/mdio/core/utils_write.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,7 @@
1111

1212

1313
MAX_SIZE_LIVE_MASK = 512 * 1024**2
14+
MAX_COORDINATES_BYTES = 128 * 1024**2
1415

1516
JsonSerializable = str | int | float | bool | None | dict[str, "JsonSerializable"] | list["JsonSerializable"]
1617

0 commit comments

Comments
 (0)