|
| 1 | +use datafusion::arrow::array::{Array, RecordBatch, UInt32Array}; |
| 2 | +use datafusion::arrow::compute::{concat_batches, take_record_batch}; |
| 3 | +use datafusion::arrow::error::ArrowError; |
| 4 | +use std::sync::Arc; |
| 5 | + |
/// Default number of rows fetched/displayed per page of results.
pub const PAGE_SIZE: usize = 100;
| 7 | + |
/// Calculate the half-open row range `[start, end)` needed for a given page.
///
/// Uses saturating arithmetic so that absurdly large `page`/`page_size`
/// combinations clamp at `usize::MAX` instead of overflowing — plain `*`/`+`
/// would panic in debug builds and silently wrap (yielding a bogus small
/// range) in release builds. Callers downstream clamp `end` to the rows
/// actually loaded, so a saturated range degrades gracefully.
pub fn page_row_range(page: usize, page_size: usize) -> (usize, usize) {
    let start = page.saturating_mul(page_size);
    let end = start.saturating_add(page_size);
    (start, end)
}
| 14 | + |
| 15 | +/// Check if we have enough rows loaded to display the requested page |
| 16 | +pub fn has_sufficient_rows(loaded_rows: usize, page: usize, page_size: usize) -> bool { |
| 17 | + let (_start, end) = page_row_range(page, page_size); |
| 18 | + loaded_rows >= end |
| 19 | +} |
| 20 | + |
| 21 | +/// Extract a page of rows from loaded batches |
| 22 | +/// This handles pagination across batch boundaries by concatenating only what's needed |
| 23 | +pub fn extract_page( |
| 24 | + batches: &[RecordBatch], |
| 25 | + page: usize, |
| 26 | + page_size: usize, |
| 27 | +) -> Result<RecordBatch, ArrowError> { |
| 28 | + if batches.is_empty() { |
| 29 | + return Ok(RecordBatch::new_empty(Arc::new( |
| 30 | + datafusion::arrow::datatypes::Schema::empty(), |
| 31 | + ))); |
| 32 | + } |
| 33 | + |
| 34 | + let total_rows: usize = batches.iter().map(|b| b.num_rows()).sum(); |
| 35 | + let (start, end) = page_row_range(page, page_size); |
| 36 | + |
| 37 | + // Clamp end to available rows |
| 38 | + let end = end.min(total_rows); |
| 39 | + |
| 40 | + if start >= total_rows { |
| 41 | + // Page is beyond available data |
| 42 | + return Ok(RecordBatch::new_empty(batches[0].schema())); |
| 43 | + } |
| 44 | + |
| 45 | + // Create indices for the rows we want |
| 46 | + let indices = UInt32Array::from_iter_values((start as u32)..(end as u32)); |
| 47 | + |
| 48 | + // Extract rows from batches |
| 49 | + extract_rows_from_batches(batches, &indices) |
| 50 | +} |
| 51 | + |
| 52 | +/// Extract specific rows (by global indices) from batches |
| 53 | +/// Handles batch boundaries by concatenating only necessary batches |
| 54 | +fn extract_rows_from_batches( |
| 55 | + batches: &[RecordBatch], |
| 56 | + indices: &dyn Array, |
| 57 | +) -> Result<RecordBatch, ArrowError> { |
| 58 | + match batches.len() { |
| 59 | + 0 => Ok(RecordBatch::new_empty(Arc::new( |
| 60 | + datafusion::arrow::datatypes::Schema::empty(), |
| 61 | + ))), |
| 62 | + 1 => take_record_batch(&batches[0], indices), |
| 63 | + _ => { |
| 64 | + // Multiple batches: concat then extract rows |
| 65 | + // Only concat the batches we've loaded (lazy loading ensures minimal concat) |
| 66 | + let schema = batches[0].schema(); |
| 67 | + let concatenated = concat_batches(&schema, batches)?; |
| 68 | + take_record_batch(&concatenated, indices) |
| 69 | + } |
| 70 | + } |
| 71 | +} |
| 72 | + |
#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_page_row_range() {
        assert_eq!(page_row_range(0, 100), (0, 100));
        assert_eq!(page_row_range(1, 100), (100, 200));
        assert_eq!(page_row_range(2, 50), (100, 150));
        // Degenerate page size yields an empty range.
        assert_eq!(page_row_range(5, 0), (0, 0));
    }

    #[test]
    fn test_has_sufficient_rows() {
        assert!(has_sufficient_rows(100, 0, 100)); // Exactly enough
        assert!(has_sufficient_rows(150, 0, 100)); // More than enough
        assert!(!has_sufficient_rows(50, 0, 100)); // Not enough
        assert!(!has_sufficient_rows(150, 1, 100)); // Need 200, only have 150
        assert!(!has_sufficient_rows(0, 0, 100)); // Nothing loaded yet
        assert!(has_sufficient_rows(0, 0, 0)); // Zero-size page needs zero rows
    }
}
0 commit comments