ESQL: Begin using .. for ranges (elastic#134460)

nik9000 · web-flow · commit 329e2c1122a0 · 2025-09-10T15:24:42.000-04:00
The CSV fixtures we use to test loading enrich policies embedded JSON
range objects directly in the CSV cells. That was ugly but worked well
enough for a while. ESQL is going to have an actual syntax for range
literals soon, so this ports the test fixtures to that `..` syntax and
has the CSV loader convert it back to JSON for `*_range` columns.

```
-{"gte": "1900-01-01"\, "lt":"1910-01-01"}, 1900, Edwardian Era
+1900-01-01..1910-01-01                   , 1900, Edwardian Era
```
diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/java/org/elasticsearch/xpack/esql/CsvTestsDataLoader.java b/x-pack/plugin/esql/qa/testFixtures/src/main/java/org/elasticsearch/xpack/esql/CsvTestsDataLoader.java
@@ -46,6 +46,8 @@
 import java.util.Map;
 import java.util.Set;
 import java.util.concurrent.Semaphore;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
 import java.util.stream.Collectors;
 import java.util.stream.Stream;
 
@@ -637,6 +639,8 @@ public static String readTextFile(URL resource) throws IOException {
         }
     }
 
+    record ColumnHeader(String name, String type) {}
+
     @SuppressWarnings("unchecked")
     /**
      * Loads a classic csv file in an ES cluster using a RestClient.
@@ -654,12 +658,13 @@ public static String readTextFile(URL resource) throws IOException {
      */
     private static void loadCsvData(RestClient client, String indexName, URL resource, boolean allowSubFields, Logger logger)
         throws IOException {
+
         ArrayList<String> failures = new ArrayList<>();
         StringBuilder builder = new StringBuilder();
         try (BufferedReader reader = reader(resource)) {
             String line;
             int lineNumber = 1;
-            String[] columns = null; // list of column names. If one column name contains dot, it is a subfield and its value will be null
+            ColumnHeader[] columns = null; // Column info. If one column name contains dot, it is a subfield and its value will be null
             List<Integer> subFieldsIndices = new ArrayList<>(); // list containing the index of a subfield in "columns" String[]
 
             while ((line = reader.readLine()) != null) {
@@ -669,15 +674,16 @@ private static void loadCsvData(RestClient client, String indexName, URL resourc
                     String[] entries = multiValuesAwareCsvToStringArray(line, lineNumber);
                     // the schema row
                     if (columns == null) {
-                        columns = new String[entries.length];
+                        columns = new ColumnHeader[entries.length];
                         for (int i = 0; i < entries.length; i++) {
                             int split = entries[i].indexOf(':');
                             if (split < 0) {
-                                columns[i] = entries[i].trim();
+                                columns[i] = new ColumnHeader(entries[i].trim(), null);
                             } else {
                                 String name = entries[i].substring(0, split).trim();
+                                String type = entries[i].substring(split + 1).trim();
                                 if (allowSubFields || name.contains(".") == false) {
-                                    columns[i] = name;
+                                    columns[i] = new ColumnHeader(name, type);
                                 } else {// if it's a subfield, ignore it in the _bulk request
                                     columns[i] = null;
                                     subFieldsIndices.add(i);
@@ -707,7 +713,7 @@ private static void loadCsvData(RestClient client, String indexName, URL resourc
                                     // Value is null, skip
                                     continue;
                                 }
-                                if ("_id".equals(columns[i])) {
+                                if (columns[i] != null && "_id".equals(columns[i].name)) {
                                     // Value is an _id
                                     idField = entries[i];
                                     continue;
@@ -722,17 +728,17 @@ private static void loadCsvData(RestClient client, String indexName, URL resourc
                                     if (multiValues.length > 1) {
                                         StringBuilder rowStringValue = new StringBuilder("[");
                                         for (String s : multiValues) {
-                                            rowStringValue.append(quoteIfNecessary(s)).append(",");
+                                            rowStringValue.append(toJson(columns[i].type, s)).append(",");
                                         }
                                         // remove the last comma and put a closing bracket instead
                                         rowStringValue.replace(rowStringValue.length() - 1, rowStringValue.length(), "]");
                                         entries[i] = rowStringValue.toString();
                                     } else {
-                                        entries[i] = quoteIfNecessary(entries[i]);
+                                        entries[i] = toJson(columns[i].type, entries[i]);
                                     }
                                     // replace any escaped commas with single comma
                                     entries[i] = entries[i].replace(ESCAPED_COMMA_SEQUENCE, ",");
-                                    row.append("\"").append(columns[i]).append("\":").append(entries[i]);
+                                    row.append("\"").append(columns[i].name).append("\":").append(entries[i]);
                                 } catch (Exception e) {
                                     throw new IllegalArgumentException(
                                         format(
@@ -770,10 +776,23 @@ private static void loadCsvData(RestClient client, String indexName, URL resourc
         }
     }
 
-    private static String quoteIfNecessary(String value) {
-        boolean isQuoted = (value.startsWith("\"") && value.endsWith("\"")) || (value.startsWith("{") && value.endsWith("}"));
-        boolean isNumeric = value.matches(NUMERIC_REGEX);
-        return isQuoted || isNumeric ? value : "\"" + value + "\"";
+    private static final Pattern RANGE_PATTERN = Pattern.compile("([0-9\\-.Z:]+)\\.\\.([0-9\\-.Z:]+)");
+
+    private static String toJson(String type, String value) {
+        return switch (type == null ? "" : type) {
+            case "date_range", "double_range", "integer_range" -> {
+                Matcher m = RANGE_PATTERN.matcher(value);
+                if (m.matches() == false) {
+                    throw new IllegalArgumentException("can't parse range: " + value);
+                }
+                yield "{\"gte\": \"" + m.group(1) + "\", \"lt\": \"" + m.group(2) + "\"}";
+            }
+            default -> {
+                boolean isQuoted = (value.startsWith("\"") && value.endsWith("\"")) || (value.startsWith("{") && value.endsWith("}"));
+                boolean isNumeric = value.matches(NUMERIC_REGEX);
+                yield isQuoted || isNumeric ? value : "\"" + value + "\"";
+            }
+        };
     }
 
     private static void sendBulkRequest(String indexName, StringBuilder builder, RestClient client, Logger logger, List<String> failures)
diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/data/ages.csv b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/data/ages.csv
@@ -1,11 +1,11 @@
 age_range:integer_range, description:keyword
-{"gte": 0\, "lt":2},     Baby
-{"gte": 2\, "lt":4},     Toddler
-{"gte": 3\, "lt":5},     Preschooler
-{"gte": 5\, "lt":12},    Child
-{"gte": 13\, "lt":20},   Adolescent
-{"gte": 20\, "lt":40},   Young Adult
-{"gte": 40\, "lt":60},   Middle-aged
-{"gte": 60\, "lt":80},   Senior
-{"gte": 80\, "lt":100},  Elderly
-{"gte": 100\, "lt":200}, Incredible
+                 0..2  , Baby
+                 2..4  , Toddler
+                 3..5  , Preschooler
+                 5..12 , Child
+                13..20 , Adolescent
+                20..40 , Young Adult
+                40..60 , Middle-aged
+                60..80 , Senior
+                80..100, Elderly
+               100..200, Incredible
diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/data/decades.csv b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/data/decades.csv
@@ -1,14 +1,14 @@
-date_range:date_range,   decade:integer, description:keyword
-{"gte": "1900-01-01"\, "lt":"1910-01-01"}, 1900, Edwardian Era
-{"gte": "1910-01-01"\, "lt":"1920-01-01"}, 1910, Ragtime Era
-{"gte": "1920-01-01"\, "lt":"1930-01-01"}, 1920, Roaring Twenties
-{"gte": "1930-01-01"\, "lt":"1940-01-01"}, 1930, Dirty Thirties
-{"gte": "1940-01-01"\, "lt":"1950-01-01"}, 1940, Fabulous Forties
-{"gte": "1950-01-01"\, "lt":"1960-01-01"}, 1950, Nifty Fifties
-{"gte": "1960-01-01"\, "lt":"1970-01-01"}, 1960, Swinging Sixties
-{"gte": "1970-01-01"\, "lt":"1980-01-01"}, 1970, Groovy Seventies
-{"gte": "1980-01-01"\, "lt":"1990-01-01"}, 1980, Radical Eighties
-{"gte": "1990-01-01"\, "lt":"2000-01-01"}, 1990, Nineties Nostalgia
-{"gte": "2000-01-01"\, "lt":"2010-01-01"}, 2000, Innovation Explosion Decade
-{"gte": "2010-01-01"\, "lt":"2020-01-01"}, 2010, Renaissance Decade
-{"gte": "2020-01-01"\, "lt":"2030-01-01"}, 2020, Empowerment Era
+ date_range:date_range, decade:integer, description:keyword
+1900-01-01..1910-01-01,           1900, Edwardian Era
+1910-01-01..1920-01-01,           1910, Ragtime Era
+1920-01-01..1930-01-01,           1920, Roaring Twenties
+1930-01-01..1940-01-01,           1930, Dirty Thirties
+1940-01-01..1950-01-01,           1940, Fabulous Forties
+1950-01-01..1960-01-01,           1950, Nifty Fifties
+1960-01-01..1970-01-01,           1960, Swinging Sixties
+1970-01-01..1980-01-01,           1970, Groovy Seventies
+1980-01-01..1990-01-01,           1980, Radical Eighties
+1990-01-01..2000-01-01,           1990, Nineties Nostalgia
+2000-01-01..2010-01-01,           2000, Innovation Explosion Decade
+2010-01-01..2020-01-01,           2010, Renaissance Decade
+2020-01-01..2030-01-01,           2020, Empowerment Era
diff --git a/x-pack/plugin/esql/qa/testFixtures/src/main/resources/data/heights.csv b/x-pack/plugin/esql/qa/testFixtures/src/main/resources/data/heights.csv
@@ -1,6 +1,6 @@
 height_range:double_range, description:keyword
-{"gte": 0\, "lt": 1.5},    Very Short
-{"gte": 1.5\, "lt": 1.6},  Short
-{"gte": 1.6\, "lt": 1.8},  Medium Height
-{"gte": 1.8\, "lt": 2.0},  Tall
-{"gte": 2.0\, "lt": 5.0},  Very Tall
+                 0.0..1.5, Very Short
+                 1.5..1.6, Short
+                 1.6..1.8, Medium Height
+                 1.8..2.0, Tall
+                 2.0..5.0, Very Tall