Commit 6b5a584

fix(zephyr): route block_size/cache_type to file opener, not FS constructor (#3121)
Fixes #3117. Sole remaining CW canary blocker.

## Problem

`fsspec.open()` routes all `**kwargs` to the filesystem constructor, not to `fs.open()`. `S3FileSystem.__init__` has `default_block_size` (not `block_size`), so the kwarg leaks into `**kwargs` → `AioSession.__init__()`, which `aiobotocore 2.26.0` rejects:

```
AioSession.__init__() got an unexpected keyword argument 'block_size'
```

This means `block_size`, `cache_type`, and `maxblocks` were **never controlling S3 buffering** — they silently leaked to the session constructor, and older aiobotocore ignored them.

<details>
<summary>fsspec 2025.3.0 source trace</summary>

1. **`open()` (L491-500)**: passes `**kwargs` to `open_files()`.
2. **`open_files()` (L300)**: `get_fs_token_paths(urlpath, mode, storage_options=kwargs)` — all kwargs become filesystem constructor args.
3. **`open_files()` (L313-322)**: constructs `OpenFile(fs, path, mode, compression, ...)` — **no kwargs forwarded**.
4. **`OpenFile.__enter__()` (L105)**: `f = self.fs.open(self.path, mode=mode)` — **only path and mode** reach `fs.open()`.
</details>

## Solution

Replace `fsspec.open()` with `url_to_fs()` + `fs.open()` so that `block_size`, `cache_type`, and `cache_options` reach the file opener (`AbstractBufferedFile`) instead of the filesystem constructor. `AbstractFileSystem.open()` (spec.py L1310-1316) passes `block_size`, `cache_options`, and `**kwargs` directly to `_open()`, and handles `compression` at L1318-1324.
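The routing bug and the fix can be reproduced in miniature without S3 or fsspec. This is a minimal sketch with toy stand-ins (`ToySession`, `ToyFileSystem`, `toy_fsspec_open` are illustrative names, not fsspec code): a dispatcher that forwards all `**kwargs` to the constructor crashes when the constructor rejects unknowns, exactly as `AioSession` did.

```python
# Toy model of the kwarg-routing bug: all names here are hypothetical
# stand-ins, not real fsspec/aiobotocore classes.

class ToySession:
    def __init__(self):  # rejects any kwargs, like AioSession.__init__
        pass

class ToyFileSystem:
    def __init__(self, **session_kwargs):
        # Constructor kwargs leak into the session, as with S3FileSystem.
        self.session = ToySession(**session_kwargs)

    def open(self, path, mode="rb", block_size=None):
        return f"opened {path} with block_size={block_size}"

def toy_fsspec_open(path, mode="rb", **kwargs):
    # Mirrors fsspec.open(): kwargs become FS constructor args and
    # never reach fs.open().
    fs = ToyFileSystem(**kwargs)
    return fs.open(path, mode)

try:
    toy_fsspec_open("bucket/key", "rb", block_size=16_000_000)
except TypeError as e:
    print(e)  # prints the "unexpected keyword argument" error

# The fix: construct the filesystem separately, pass kwargs to open().
fs = ToyFileSystem()
print(fs.open("bucket/key", "rb", block_size=16_000_000))
```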
**`readers.py`** — `open_file()`:

```python
# Before: kwargs go to FS constructor → leak to AioSession
with fsspec.open(file_path, mode, compression=compression,
                 block_size=16_000_000, cache_type="background", maxblocks=2) as f:

# After: kwargs go to fs.open() → reach AbstractBufferedFile/S3File
fs, resolved_path = fsspec.core.url_to_fs(file_path)
with fs.open(resolved_path, mode, block_size=_READ_BLOCK_SIZE,
             cache_type=_READ_CACHE_TYPE,
             cache_options={"maxblocks": _READ_MAX_BLOCKS},
             compression=compression) as f:
```

**`writers.py`** — 4 call sites:

```python
# Before: block_size goes to FS constructor → AioSession crash
with fsspec.open(temp_path, "wb", block_size=64 * 1024 * 1024) as f:

# After: block_size goes to fs.open() → controls multipart upload part size
fs, resolved_temp = fsspec.core.url_to_fs(temp_path)
with fs.open(resolved_temp, "wb", block_size=_WRITE_BLOCK_SIZE) as f:
```

<details>
<summary>Backend routing</summary>

**S3**: `S3FileSystem._open(block_size=16M, cache_type="background", cache_options={"maxblocks": 2})` → `S3File` → `BackgroundBlockCache(blocksize=16M, maxblocks=2)`.

**Local**: `LocalFileSystem._open(block_size=16M, **kwargs)` — `block_size` is a named param (silently ignored), remaining kwargs absorbed by `LocalFileOpener(**kwargs)`. No crash, no effect.
</details>

<details>
<summary>Note: compresslevel=1 was also misrouted (pre-existing)</summary>

The `.gz` writer branch had `compresslevel=1` in `fsspec.open()`. This also leaked to the FS constructor — fsspec's compression wrapper calls `compress(f, mode=mode[0])` with no extra kwargs. Dropped in this PR; fixing gzip compression level is a separate concern.
</details>

## Safety

This change makes the buffering settings actually work for the first time. Previously, S3 reads used fsspec defaults (5MB blocks, "readahead" cache). After: 16MB blocks with background prefetch. S3 writes go from 50MB to 64MB multipart parts. Local file IO is unaffected.
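The `url_to_fs` + `fs.open` pattern can be exercised end-to-end against a local path. A minimal sketch, assuming `fsspec` is installed; since `LocalFileSystem` accepts and ignores `block_size`, this only verifies that the kwargs route cleanly through `fs.open()` without crashing, not the buffering itself (against `s3://` the same call would configure `S3File`):

```python
import os
import tempfile

import fsspec.core

def roundtrip(payload: bytes) -> bytes:
    """Write then read a file via url_to_fs + fs.open (illustrative helper)."""
    path = os.path.join(tempfile.mkdtemp(), "demo.bin")
    # Open-time kwargs go to fs.open(), not the FS constructor.
    fs, resolved = fsspec.core.url_to_fs(path)
    with fs.open(resolved, "wb", block_size=64 * 1024 * 1024) as f:
        f.write(payload)
    with fs.open(resolved, "rb", block_size=16_000_000) as f:
        return f.read()

print(roundtrip(b"hello"))
```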
## Testing

- [x] `test_backends.py` (9/9), full zephyr suite (351/351)
- [x] Manual R2 test: reproduced `AioSession` crash with old code, confirmed fix with new code
- [ ] Post-merge: re-run CW canary ferry
1 parent 8d752a7 commit 6b5a584

File tree

3 files changed, +30 -10 lines changed

lib/iris/src/iris/cluster/k8s/kubectl.py

Lines changed: 6 additions & 1 deletion

```diff
@@ -26,6 +26,7 @@
 import logging
 import os
 import subprocess
+import time
 from dataclasses import dataclass, field
 from datetime import datetime, timezone

@@ -115,9 +116,13 @@ def run(
             logger.info("kubectl: %s\n stdin=%s", " ".join(cmd), stdin[:2000])
         else:
             logger.info("kubectl: %s", " ".join(cmd))
+        t0 = time.monotonic()
         result = subprocess.run(cmd, input=stdin, capture_output=True, text=True, timeout=effective_timeout)
+        elapsed_ms = (time.monotonic() - t0) * 1000
         if result.returncode != 0:
-            logger.info("kubectl exit %d: stderr=%s", result.returncode, result.stderr.strip()[:500])
+            logger.info("kubectl exit %d: %dms stderr=%s", result.returncode, elapsed_ms, result.stderr.strip()[:500])
+        elif elapsed_ms > 2000:
+            logger.warning("kubectl slow: %dms cmd=%s", elapsed_ms, " ".join(args))
         return result

    def apply_json(self, manifest: dict) -> None:
```
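The timing pattern added to `run()` can be sketched standalone. A minimal sketch under stated assumptions: `timed_run` and `_SLOW_MS` are illustrative names (the real code is a method on the kubectl wrapper and also forwards stdin and a timeout), but the clock-and-log shape matches the diff.

```python
import logging
import subprocess
import sys
import time

logger = logging.getLogger("kubectl")

# Slow-call threshold; the diff above warns past 2000 ms.
_SLOW_MS = 2000

def timed_run(cmd: list[str]) -> subprocess.CompletedProcess:
    """Run a command, logging failures and slow calls (sketch of run())."""
    t0 = time.monotonic()
    result = subprocess.run(cmd, capture_output=True, text=True)
    elapsed_ms = (time.monotonic() - t0) * 1000
    if result.returncode != 0:
        logger.info("exit %d: %dms stderr=%s",
                    result.returncode, elapsed_ms, result.stderr.strip()[:500])
    elif elapsed_ms > _SLOW_MS:
        logger.warning("slow: %dms cmd=%s", elapsed_ms, " ".join(cmd))
    return result

result = timed_run([sys.executable, "-c", "print('ok')"])
```

Using `time.monotonic()` rather than `time.time()` keeps the measurement immune to wall-clock adjustments.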

lib/zephyr/src/zephyr/readers.py

Lines changed: 15 additions & 5 deletions

```diff
@@ -25,6 +25,11 @@

 logger = logging.getLogger(__name__)

+# 16 MB read blocks with background prefetch for S3/remote reads.
+_READ_BLOCK_SIZE = 16_000_000
+_READ_CACHE_TYPE = "background"
+_READ_MAX_BLOCKS = 2
+

 @dataclass
 class InputFileSpec:
@@ -77,13 +82,18 @@ def open_file(file_path: str, mode: str = "rb"):
     elif file_path.endswith(".xz"):
         compression = "xz"

-    with fsspec.open(
-        file_path,
+    # Use url_to_fs + fs.open so that block_size/cache_type reach the file
+    # opener (AbstractBufferedFile) rather than the filesystem constructor.
+    # fsspec.open() routes all **kwargs to the FS constructor, where S3's
+    # AioSession rejects unknown kwargs like block_size.
+    fs, resolved_path = fsspec.core.url_to_fs(file_path)
+    with fs.open(
+        resolved_path,
         mode,
+        block_size=_READ_BLOCK_SIZE,
+        cache_type=_READ_CACHE_TYPE,
+        cache_options={"maxblocks": _READ_MAX_BLOCKS},
         compression=compression,
-        block_size=16_000_000,
-        cache_type="background",
-        maxblocks=2,
     ) as f:
         yield f

```
lib/zephyr/src/zephyr/writers.py

Lines changed: 9 additions & 4 deletions

```diff
@@ -21,6 +21,9 @@

 logger = logging.getLogger(__name__)

+# 64 MB write blocks — controls S3 multipart upload part size.
+_WRITE_BLOCK_SIZE = 64 * 1024 * 1024
+

 def unique_temp_path(output_path: str) -> str:
     """Return a unique temporary path derived from ``output_path``.
@@ -81,22 +84,23 @@ def write_jsonl_file(records: Iterable, output_path: str) -> dict:
     encoder = msgspec.json.Encoder()

     with atomic_rename(output_path) as temp_path:
+        fs, resolved_temp = fsspec.core.url_to_fs(temp_path)
         if output_path.endswith(".zst"):
             import zstandard as zstd

             cctx = zstd.ZstdCompressor(level=2, threads=1)
-            with fsspec.open(temp_path, "wb", block_size=64 * 1024 * 1024) as raw_f:
+            with fs.open(resolved_temp, "wb", block_size=_WRITE_BLOCK_SIZE) as raw_f:
                 with cctx.stream_writer(raw_f) as f:
                     for record in records:
                         f.write(encoder.encode(record) + b"\n")
                         count += 1
         elif output_path.endswith(".gz"):
-            with fsspec.open(temp_path, "wb", compression="gzip", compresslevel=1, block_size=64 * 1024 * 1024) as f:
+            with fs.open(resolved_temp, "wb", block_size=_WRITE_BLOCK_SIZE, compression="gzip") as f:
                 for record in records:
                     f.write(encoder.encode(record) + b"\n")
                     count += 1
         else:
-            with fsspec.open(temp_path, "wb", block_size=64 * 1024 * 1024) as f:
+            with fs.open(resolved_temp, "wb", block_size=_WRITE_BLOCK_SIZE) as f:
                 for record in records:
                     f.write(encoder.encode(record) + b"\n")
                     count += 1
@@ -367,7 +371,8 @@ def write_binary_file(records: Iterable[bytes], output_path: str) -> dict:

     count = 0
     with atomic_rename(output_path) as temp_path:
-        with fsspec.open(temp_path, "wb", block_size=64 * 1024 * 1024) as f:
+        fs, resolved_temp = fsspec.core.url_to_fs(temp_path)
+        with fs.open(resolved_temp, "wb", block_size=_WRITE_BLOCK_SIZE) as f:
             for record in records:
                 f.write(record)
                 count += 1
```
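The write block size matters beyond throughput: S3 caps a multipart upload at 10,000 parts (a standard S3 limit, not something this PR changes), and each fsspec write block becomes one part, so `block_size` bounds the maximum object size. A quick check of the 50MB → 64MB change described under Safety:

```python
# S3 multipart uploads allow at most 10,000 parts; each part is one
# fsspec write block, so block_size caps the maximum object size.
MAX_PARTS = 10_000

def max_object_bytes(block_size: int) -> int:
    return block_size * MAX_PARTS

old = max_object_bytes(50 * 1024 * 1024)  # previous 50MB parts
new = max_object_bytes(64 * 1024 * 1024)  # new 64MB parts
print(old // 2**30, "GiB ->", new // 2**30, "GiB")  # → 488 GiB -> 625 GiB
```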
