Skip to content

Commit 615da03

Browse files
Authored by jadewang-db (Jade Wang) and claude
fix(csharp): respect Thrift rowCount metadata to trim excess rows in LIMIT queries (#126)
## 🥞 Stacked PR Use this [link](https://github.com/adbc-drivers/databricks/pull/126/files) to review incremental changes. - [**stack/jade.wang/PECO-2524-row-count-limiting**](#126) [[Files changed](https://github.com/adbc-drivers/databricks/pull/126/files)] --------- ## Summary When the Databricks server uses `trimArrowBatchesToLimit=false` (the default), it may return more data than the LIMIT in the last batch but reports adjusted `rowCount` values in the batch/chunk metadata so that `sum(rowCount)` equals the actual limit. This fix updates both `DatabricksReader` (inline results) and `CloudFetchReader` (CloudFetch results) to track the reported `rowCount` from metadata and trim excess rows from the actual Arrow data when needed. ## Changes ### DatabricksReader (inline Thrift results) - Track `_currentBatchExpectedRows` from `TSparkArrowBatch.RowCount` - Slice the `RecordBatch` if it exceeds the expected count ### CloudFetchReader (CloudFetch results) - Support both global (REST API) and per-chunk (Thrift) limiting: - **REST API (SEA)**: Use `manifest.TotalRowCount` for global row limit - **Thrift**: Use per-chunk `RowCount` from download results - Track `_totalExpectedRows` (global) and `_currentChunkExpectedRows` (per-chunk) ### Interface changes - `ICloudFetchResultFetcher`: Add `GetTotalExpectedRows()` method - `ThriftResultFetcher`: Accumulate total expected rows from `link.RowCount` - `StatementExecutionResultFetcher`: Return `manifest.TotalRowCount` ### Tests - `CloudFetchE2ETest`: Validate exact row count for both Thrift and REST protocols ## Test plan - [x] Build passes: `dotnet build AdbcDrivers.Databricks.csproj` - [x] All CloudFetch E2E tests pass (16/16): `dotnet test --filter "CloudFetchE2ETest.TestCloudFetch"` - [x] Tests validate exact row count for both Thrift and REST API LIMIT queries 🤖 Generated with [Claude Code](https://claude.ai/code) Closes PECO-2524 --------- Co-authored-by: Jade Wang <jade.wang+data@databricks.com> Co-authored-by: Claude 
<noreply@anthropic.com>
1 parent 5530b13 commit 615da03

File tree

4 files changed

+211
-23
lines changed

4 files changed

+211
-23
lines changed

csharp/src/Reader/CloudFetch/CloudFetchReader.cs

Lines changed: 151 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -47,6 +47,16 @@ internal sealed class CloudFetchReader : BaseDatabricksReader
4747
private ArrowStreamReader? currentReader;
4848
private IDownloadResult? currentDownloadResult;
4949

50+
// Row count limiting supports two modes:
51+
// 1. Global limiting (SEA/REST): Uses manifest.TotalRowCount for total expected rows
52+
// 2. Per-chunk limiting (Thrift): Uses TSparkArrowResultLink.RowCount per chunk
53+
// When trimArrowBatchesToLimit=false (server default), the server may return more data
54+
// than the limit in the last batch but reports adjusted rowCount in metadata.
55+
private readonly long _totalExpectedRows;
56+
private long _rowsRead;
57+
private long _currentChunkExpectedRows;
58+
private long _currentChunkRowsRead;
59+
5060
/// <summary>
5161
/// Initializes a new instance of the <see cref="CloudFetchReader"/> class.
5262
/// Protocol-agnostic constructor.
@@ -56,14 +66,21 @@ internal sealed class CloudFetchReader : BaseDatabricksReader
5666
/// <param name="schema">The Arrow schema.</param>
5767
/// <param name="response">The query response (nullable for REST API, which doesn't use IResponse).</param>
5868
/// <param name="downloadManager">The download manager (already initialized and started).</param>
69+
/// <param name="totalExpectedRows">Total expected rows for global limiting (SEA). Pass 0 to use per-chunk limiting (Thrift).</param>
5970
public CloudFetchReader(
6071
ITracingStatement statement,
6172
Schema schema,
6273
IResponse? response,
63-
ICloudFetchDownloadManager downloadManager)
74+
ICloudFetchDownloadManager downloadManager,
75+
long totalExpectedRows = 0)
6476
: base(statement, schema, response, isLz4Compressed: false) // isLz4Compressed handled by download manager
6577
{
6678
this.downloadManager = downloadManager ?? throw new ArgumentNullException(nameof(downloadManager));
79+
if (totalExpectedRows < 0)
80+
{
81+
throw new ArgumentOutOfRangeException(nameof(totalExpectedRows), totalExpectedRows, "Total expected rows cannot be negative.");
82+
}
83+
_totalExpectedRows = totalExpectedRows;
6784
}
6885

6986
/// <summary>
@@ -79,25 +96,47 @@ public CloudFetchReader(
7996

8097
while (true)
8198
{
99+
// Check global row limit first (used by SEA with manifest.TotalRowCount)
100+
if (_totalExpectedRows > 0 && _rowsRead >= _totalExpectedRows)
101+
{
102+
Activity.Current?.AddEvent("cloudfetch.global_row_limit_reached", [
103+
new("total_expected_rows", _totalExpectedRows),
104+
new("rows_read", _rowsRead)
105+
]);
106+
CleanupCurrentReaderAndDownloadResult();
107+
return null;
108+
}
109+
110+
// Check per-chunk row limit (used by Thrift with TSparkArrowResultLink.RowCount)
111+
if (_totalExpectedRows <= 0 && _currentChunkExpectedRows > 0 && _currentChunkRowsRead >= _currentChunkExpectedRows)
112+
{
113+
Activity.Current?.AddEvent("cloudfetch.chunk_row_limit_reached", [
114+
new("chunk_expected_rows", _currentChunkExpectedRows),
115+
new("chunk_rows_read", _currentChunkRowsRead)
116+
]);
117+
// Move to next chunk
118+
CleanupCurrentReaderAndDownloadResult();
119+
}
120+
82121
// If we have a current reader, try to read the next batch
83122
if (this.currentReader != null)
84123
{
85124
RecordBatch? next = await this.currentReader.ReadNextRecordBatchAsync(cancellationToken);
86125
if (next != null)
87126
{
88-
return next;
127+
// Apply row count limiting: trim the batch if it would exceed expected rows
128+
next = ApplyRowCountLimit(next);
129+
if (next != null)
130+
{
131+
return next;
132+
}
133+
// If next is null after limiting, we've reached the limit
134+
continue;
89135
}
90136
else
91137
{
92138
// Clean up the current reader and download result
93-
this.currentReader.Dispose();
94-
this.currentReader = null;
95-
96-
if (this.currentDownloadResult != null)
97-
{
98-
this.currentDownloadResult.Dispose();
99-
this.currentDownloadResult = null;
100-
}
139+
CleanupCurrentReaderAndDownloadResult();
101140
}
102141
}
103142

@@ -117,8 +156,13 @@ public CloudFetchReader(
117156
return null;
118157
}
119158

159+
// Set up chunk-level row count tracking
160+
_currentChunkExpectedRows = this.currentDownloadResult.RowCount;
161+
_currentChunkRowsRead = 0;
162+
120163
Activity.Current?.AddEvent("cloudfetch.reader_waiting_for_download", [
121-
new("chunk_index", this.currentDownloadResult.ChunkIndex)
164+
new("chunk_index", this.currentDownloadResult.ChunkIndex),
165+
new("chunk_row_count", this.currentDownloadResult.RowCount)
122166
]);
123167

124168
await this.currentDownloadResult.DownloadCompletedTask;
@@ -160,6 +204,102 @@ public CloudFetchReader(
160204
});
161205
}
162206

207+
/// <summary>
208+
/// Cleans up the current reader and download result, resetting chunk-level tracking.
209+
/// </summary>
210+
private void CleanupCurrentReaderAndDownloadResult()
211+
{
212+
if (this.currentReader != null)
213+
{
214+
this.currentReader.Dispose();
215+
this.currentReader = null;
216+
}
217+
if (this.currentDownloadResult != null)
218+
{
219+
this.currentDownloadResult.Dispose();
220+
this.currentDownloadResult = null;
221+
}
222+
_currentChunkExpectedRows = 0;
223+
_currentChunkRowsRead = 0;
224+
}
225+
226+
/// <summary>
227+
/// Applies row count limiting to a record batch.
228+
/// Supports two modes:
229+
/// - Global limiting (SEA): Uses _totalExpectedRows from manifest.TotalRowCount
230+
/// - Per-chunk limiting (Thrift): Uses _currentChunkExpectedRows from TSparkArrowResultLink.RowCount
231+
/// </summary>
232+
private RecordBatch? ApplyRowCountLimit(RecordBatch batch)
233+
{
234+
// Mode 1: Global row limiting (SEA with manifest.TotalRowCount)
235+
if (_totalExpectedRows > 0)
236+
{
237+
long remainingRows = _totalExpectedRows - _rowsRead;
238+
239+
if (batch.Length <= remainingRows)
240+
{
241+
_rowsRead += batch.Length;
242+
return batch;
243+
}
244+
245+
if (remainingRows <= 0)
246+
{
247+
return null;
248+
}
249+
250+
Activity.Current?.AddEvent("cloudfetch.trimming_batch_global", [
251+
new("original_length", batch.Length),
252+
new("trimmed_length", remainingRows),
253+
new("total_expected_rows", _totalExpectedRows),
254+
new("rows_read_before", _rowsRead)
255+
]);
256+
257+
// Slice uses reference counting - dispose original to release its reference
258+
var globalTrimmedBatch = batch.Slice(0, (int)remainingRows);
259+
batch.Dispose();
260+
_rowsRead += globalTrimmedBatch.Length;
261+
return globalTrimmedBatch;
262+
}
263+
264+
// Mode 2: Per-chunk row limiting (Thrift with TSparkArrowResultLink.RowCount)
265+
// If no row limit tracking for this chunk (0 means no limit set, negative is invalid/defensive)
266+
if (_currentChunkExpectedRows <= 0)
267+
{
268+
_currentChunkRowsRead += batch.Length;
269+
return batch;
270+
}
271+
272+
long chunkRemainingRows = _currentChunkExpectedRows - _currentChunkRowsRead;
273+
274+
// If we can return the full batch without exceeding the limit
275+
if (batch.Length <= chunkRemainingRows)
276+
{
277+
_currentChunkRowsRead += batch.Length;
278+
return batch;
279+
}
280+
281+
// We need to trim the batch - it contains more rows than we should return
282+
if (chunkRemainingRows <= 0)
283+
{
284+
// We've already read all expected rows for this chunk
285+
return null;
286+
}
287+
288+
Activity.Current?.AddEvent("cloudfetch.trimming_batch_chunk", [
289+
new("original_length", batch.Length),
290+
new("trimmed_length", chunkRemainingRows),
291+
new("chunk_expected_rows", _currentChunkExpectedRows),
292+
new("chunk_rows_read_before", _currentChunkRowsRead)
293+
]);
294+
295+
// Slice uses reference counting - dispose original to release its reference
296+
var chunkTrimmedBatch = batch.Slice(0, (int)chunkRemainingRows);
297+
batch.Dispose();
298+
_currentChunkRowsRead += chunkTrimmedBatch.Length;
299+
300+
return chunkTrimmedBatch;
301+
}
302+
163303
protected override void Dispose(bool disposing)
164304
{
165305
if (this.currentReader != null)

csharp/src/Reader/CloudFetch/CloudFetchReaderFactory.cs

Lines changed: 6 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -109,8 +109,9 @@ public static CloudFetchReader CreateThriftReader(
109109
// Start the download manager
110110
downloadManager.StartAsync().Wait();
111111

112-
// Create and return the reader
113-
return new CloudFetchReader(statement, schema, response, downloadManager);
112+
// For Thrift, use chunk-level row count limiting (pass 0 for totalExpectedRows)
113+
// because we don't know the total upfront - the fetcher accumulates as it goes
114+
return new CloudFetchReader(statement, schema, response, downloadManager, totalExpectedRows: 0);
114115
}
115116

116117
/// <summary>
@@ -200,11 +201,9 @@ public static CloudFetchReader CreateStatementExecutionReader(
200201
// Start the download manager
201202
downloadManager.StartAsync().Wait();
202203

203-
// Create and return the reader
204-
// Note: response is null for Statement Execution API because CloudFetchReader doesn't use it.
205-
// The IResponse parameter exists for compatibility with the Thrift path (DatabricksReader),
206-
// which uses it for direct results and operation handle management.
207-
return new CloudFetchReader(statement, schema, response: null, downloadManager);
204+
// For REST API (SEA), use global row count limiting from manifest.TotalRowCount.
205+
// The manifest contains the adjusted total row count that respects LIMIT queries.
206+
return new CloudFetchReader(statement, schema, response: null, downloadManager, totalExpectedRows: manifest.TotalRowCount);
208207
}
209208
}
210209
}

csharp/src/Reader/DatabricksReader.cs

Lines changed: 43 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -42,6 +42,11 @@ internal sealed class DatabricksReader : BaseDatabricksReader
4242
int index;
4343
IArrowReader? reader;
4444

45+
// Row count limiting: tracks the expected row count for the current batch from metadata.
46+
// When trimArrowBatchesToLimit=false (server default), the server may return more data
47+
// than the limit in the last batch but reports adjusted rowCount in metadata.
48+
private long _currentBatchExpectedRows;
49+
4550
public DatabricksReader(IHiveServer2Statement statement, Schema schema, IResponse response, TFetchResultsResp? initialResults, bool isLz4Compressed)
4651
: base(statement, schema, response, isLz4Compressed) // IHiveServer2Statement implements IActivityTracer
4752
{
@@ -73,8 +78,15 @@ public DatabricksReader(IHiveServer2Statement statement, Schema schema, IRespons
7378
RecordBatch? next = await this.reader.ReadNextRecordBatchAsync(cancellationToken);
7479
if (next != null)
7580
{
76-
activity?.AddEvent(SemanticConventions.Messaging.Batch.Response, [new(SemanticConventions.Db.Response.ReturnedRows, next.Length)]);
77-
return next;
81+
// Apply row count limiting: trim the batch if actual data exceeds metadata row count
82+
next = ApplyRowCountLimit(next, activity);
83+
if (next != null)
84+
{
85+
activity?.AddEvent(SemanticConventions.Messaging.Batch.Response, [new(SemanticConventions.Db.Response.ReturnedRows, next.Length)]);
86+
return next;
87+
}
88+
// If next is null after limiting, continue to next batch
89+
continue;
7890
}
7991
this.reader = null;
8092
}
@@ -127,12 +139,41 @@ public DatabricksReader(IHiveServer2Statement statement, Schema schema, IRespons
127139
});
128140
}
129141

142+
/// <summary>
143+
/// Applies row count limiting to a record batch.
144+
/// When the server returns more rows than the metadata reports (trimArrowBatchesToLimit=false),
145+
/// this method trims the batch to match the expected row count from metadata.
146+
/// </summary>
147+
private RecordBatch? ApplyRowCountLimit(RecordBatch batch, System.Diagnostics.Activity? activity)
148+
{
149+
// If no row limit tracking (0 means no limit set, negative is invalid/defensive),
150+
// or batch fits within expected count - return as-is
151+
if (_currentBatchExpectedRows <= 0 || batch.Length <= _currentBatchExpectedRows)
152+
{
153+
return batch;
154+
}
155+
156+
// We need to trim the batch - actual data exceeds metadata row count
157+
activity?.AddEvent("databricks_reader.trimming_batch", [
158+
new("original_length", batch.Length),
159+
new("expected_rows", _currentBatchExpectedRows)
160+
]);
161+
162+
// Slice uses reference counting - dispose original to release its reference
163+
var trimmedBatch = batch.Slice(0, (int)_currentBatchExpectedRows);
164+
batch.Dispose();
165+
return trimmedBatch;
166+
}
167+
130168
private void ProcessFetchedBatches()
131169
{
132170
this.TraceActivity(activity =>
133171
{
134172
var batch = this.batches![this.index];
135173

174+
// Store the expected row count from metadata for row count limiting
175+
_currentBatchExpectedRows = batch.RowCount;
176+
136177
// Ensure batch data exists
137178
if (batch.Batch == null || batch.Batch.Length == 0)
138179
{

csharp/test/E2E/CloudFetchE2ETest.cs

Lines changed: 11 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -114,11 +114,16 @@ public static IEnumerable<object[]> TestCases()
114114
{
115115
string[] protocols = { "thrift", "rest" };
116116

117+
string zeroQuery = "SELECT * FROM range(1000) LIMIT 0";
117118
string smallQuery = "SELECT * FROM range(1000)";
118119
string largeQuery = "SELECT * FROM main.tpcds_sf100_delta.store_sales LIMIT 1000000";
119120

120121
foreach (var protocol in protocols)
121122
{
123+
// LIMIT 0 test cases - edge case for empty result set (PECO-2524)
124+
yield return new object[] { zeroQuery, 0, true, true, protocol };
125+
yield return new object[] { zeroQuery, 0, false, true, protocol };
126+
122127
// Small query test cases
123128
yield return new object[] { smallQuery, 1000, true, true, protocol };
124129
yield return new object[] { smallQuery, 1000, false, true, protocol };
@@ -171,6 +176,7 @@ public async Task TestCloudFetch(string query, int rowCount, bool useCloudFetch,
171176

172177
/// <summary>
173178
/// Executes a query and validates the row count.
179+
/// Validates exact row count to ensure the driver correctly respects LIMIT N in queries (PECO-2524).
174180
/// </summary>
175181
private async Task ExecuteAndValidateQuery(AdbcConnection connection, string query, int expectedRowCount, string protocolName)
176182
{
@@ -206,14 +212,16 @@ private async Task ExecuteAndValidateQuery(AdbcConnection connection, string que
206212
}
207213
Console.WriteLine($"[TEST] Finished reading {batchCount} batches, {totalRows} total rows");
208214

209-
Assert.True(totalRows >= expectedRowCount,
210-
$"Expected at least {expectedRowCount} rows but got {totalRows} using {protocolName}");
215+
// Validate exact row count - driver must respect LIMIT N and trim excess rows (PECO-2524)
216+
// For Thrift: sum of all batch.RowCount = total expected rows
217+
// For REST API (SEA): manifest.TotalRowCount = total expected rows
218+
Assert.Equal(expectedRowCount, totalRows);
211219

212220
Assert.Null(await result.Stream.ReadNextRecordBatchAsync());
213221
statement.Dispose();
214222

215223
// Also log to the test output helper if available
216-
OutputHelper?.WriteLine($"[{protocolName}] Read {totalRows} rows");
224+
OutputHelper?.WriteLine($"[{protocolName}] Read exactly {totalRows} rows as expected");
217225
}
218226
}
219227
}

0 commit comments

Comments (0)