From cb03a30ede53a3ef3d93eaea413c5587f56756d4 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Thu, 18 Sep 2025 15:20:16 -0700 Subject: [PATCH 01/30] initial docs --- .../docs/r2/sql/end-to-end-pipeline.mdx | 364 ++++++++++++++++++ src/content/docs/r2/sql/index.mdx | 21 + .../platform/limitations-best-practices.mdx | 212 ++++++++++ src/content/docs/r2/sql/platform/pricing.mdx | 0 .../docs/r2/sql/platform/sql-reference.mdx | 251 ++++++++++++ src/content/docs/r2/sql/troubleshooting.mdx | 308 +++++++++++++++ 6 files changed, 1156 insertions(+) create mode 100644 src/content/docs/r2/sql/end-to-end-pipeline.mdx create mode 100644 src/content/docs/r2/sql/index.mdx create mode 100644 src/content/docs/r2/sql/platform/limitations-best-practices.mdx create mode 100644 src/content/docs/r2/sql/platform/pricing.mdx create mode 100644 src/content/docs/r2/sql/platform/sql-reference.mdx create mode 100644 src/content/docs/r2/sql/troubleshooting.mdx diff --git a/src/content/docs/r2/sql/end-to-end-pipeline.mdx b/src/content/docs/r2/sql/end-to-end-pipeline.mdx new file mode 100644 index 00000000000000..455d5ed5fd0a36 --- /dev/null +++ b/src/content/docs/r2/sql/end-to-end-pipeline.mdx @@ -0,0 +1,364 @@ +--- +title: Build a fraud detection pipeline with Cloudflare Pipelines and R2 SQL +summary: Learn how to create an end-to-end data pipeline using Cloudflare Pipelines, R2 Data Catalog, and R2 SQL for real-time transaction analysis. +pcx_content_type: tutorial +products: + - R2 + - R2 Data Catalog + - R2 SQL +--- + + +# Build a fraud detection pipeline with the Cloudflare Data Platform + +In this guide, you will learn how to build a complete data pipeline using Cloudflare Pipelines, R2 Data Catalog, and R2 SQL. This also includes a sample Python script that creates and sends financial transaction data to your Pipeline that can be queried by R2 SQL or any Apache Iceberg-compatible query engine. + +This tutorial demonstrates how to: +- Set up R2 Data Catalog to store our transaction events in an Apache Iceberg table +- Set up a Cloudflare Pipeline +- Create transaction data with fraud patterns to send to your Pipeline +- Query your data using R2 SQL for fraud analysis + + +## Prerequisites + +1. Sign up for a [Cloudflare account](https://dash.cloudflare.com/sign-up). +2. Install [Node.js](https://nodejs.org/en/). +3. Install [Python 3.8+](https://python.org) for the data generation script. + +:::note[Node.js version manager] +Use a Node version manager like [Volta](https://volta.sh/) or [nvm](https://github.com/nvm-sh/nvm) to avoid permission issues and change Node.js versions. Wrangler requires a Node version of 16.17.0 or later. +::: + +## 1. Set up authentication + +You'll need API tokens to interact with Cloudflare services. + +### Custom API Token +1. Go to **My Profile** → **API Tokens** in the Cloudflare dashboard +2. Select **Create Token** → **Custom token** +3. Add the following permissions: + - **Workers R2 Storage** - Edit, Read + - **Workers R2 Data Catalog** - Edit, Read + - **Workers R2 SQL** - Read + - **Workers R2 SQL** - Read, Send, Edit + +Export your new token as an environment variable: + +```bash +export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here +``` + +If this is your first time using Wrangler, make sure to login. +```bash +npx wrangler login +``` + +## 2. Create an R2 bucket + +Create a new R2 bucket to store your fraud detection data: + +```bash +npx wrangler r2 bucket create fraud-detection-data +``` + +## 3. 
Enable R2 Data Catalog + +Enable the Data Catalog feature on your bucket to use Apache Iceberg tables: + +```bash +npx wrangler r2 bucket catalog enable fraud-detection-data +``` +:::note +Make sure to save the Warehouse for use later in this guide +::: + +### Optional - Enable compaction on your R2 Data Catalog +R2 Data Catalog can automatically compact tables for you. In production event streaming use cases, it's common to end up with many small files so it's recommended to enable compaction. Since this is a sample use case, this is optional. +```bash +npx wrangler r2 bucket catalog compaction enable fraud-detection-data --token $WRANGLER_R2_SQL_AUTH_TOKEN +``` + +## 4. Set up the pipeline infrastructure + +### Create the Pipeline stream + +Create a stream to receive incoming fraud detection events: + +```bash +npx wrangler pipelines streams create fraud-transactions \ + --schema '{ + "fields": [ + {"name": "transaction_id", "type": "string", "required": true}, + {"name": "user_id", "type": "int64", "required": true}, + {"name": "amount", "type": "f64", "required": false}, + {"name": "transaction_timestamp", "type": "string", "required": false}, + {"name": "location", "type": "string", "required": false}, + {"name": "merchant_category", "type": "string", "required": false}, + {"name": "is_fraud", "type": "string", "required": false}, + {"name": "ingestion_timestamp", "type": "string", "required": false} + ] + }' \ + --http-enabled true \ + --http-auth true +``` +:::note +After running the `stream create` command, note the **Stream Endpoint URL** from the output. This is the endpoint you'll use to send data to your pipeline. +::: + +### Create the data sink + +Create a sink that writes data to your R2 bucket as Apache Iceberg tables: + +```bash +npx wrangler pipelines sinks create fraud-data-sink \ + --type "r2-data-catalog" \ + --bucket "fraud-detection-data" \ + --roll-interval 30 \ + --namespace "fraud_detection" \ + --table "transactions" \ + --catalog-token $WRANGLER_R2_SQL_AUTH_TOKEN +``` + +:::note +This creates a `sink` configuration that will write to the Iceberg table fraud_detection.transactions every 30 seconds. Pipelines automatically appends an `__ingest_ts` column that is used to partion the table by `DAY` +::: + +### Create the pipeline + +Connect your stream to your sink with SQL: + +```bash +npx wrangler pipelines create fraud-pipeline \ + --sql "INSERT INTO fraud-data-sink SELECT * FROM fraud-transactions" +``` + +## 5. 
Generate fraud detection data + +Create a Python script to generate realistic transaction data with fraud patterns: + +```python title="fraud_data_generator.py" +import requests +import json +import uuid +import random +import time +from datetime import datetime, timezone, timedelta + +# Configuration +STREAM_ENDPOINT = "https://YOUR_STREAM_ID.ingest.cloudflare.com" # From the stream you created +API_TOKEN = "WRANGLER_R2_SQL_AUTH_TOKEN" #the same one created earlier +EVENTS_TO_SEND = 1000 # Feel free to adjust this + +def generate_transaction(): + """Generate some transactions with occassional fraud patterns""" + + # User IDs + high_risk_users = [1001, 1002, 1003, 1004, 1005] + normal_users = list(range(1006, 2000)) + + user_id = random.choice(high_risk_users + normal_users) + is_high_risk_user = user_id in high_risk_users + + # Generate amount + if random.random() < 0.05: + amount = round(random.uniform(5000, 50000), 2) + elif random.random() < 0.03: + amount = round(random.uniform(0.01, 1.00), 2) + else: + amount = round(random.uniform(10, 500), 2) + + # Locations + normal_locations = ["NEW_YORK", "LOS_ANGELES", "CHICAGO", "MIAMI", "SEATTLE"] + high_risk_locations = ["UNKNOWN_LOCATION", "VPN_EXIT", "BELARUS", "NIGERIA"] + + if is_high_risk_user and random.random() < 0.3: + location = random.choice(high_risk_locations) + else: + location = random.choice(normal_locations) + + # Merchant categories + normal_merchants = ["GROCERY", "GAS_STATION", "RESTAURANT", "RETAIL"] + high_risk_merchants = ["GAMBLING", "CRYPTO", "MONEY_TRANSFER", "GIFT_CARDS"] + + if random.random() < 0.1: # 10% high-risk merchants + merchant_category = random.choice(high_risk_merchants) + else: + merchant_category = random.choice(normal_merchants) + + # Determine if transaction is fraudulent based on basic risk factors + fraud_score = 0 + if amount > 2000: fraud_score += 0.4 + if amount < 1: fraud_score += 0.3 + if location in high_risk_locations: fraud_score += 0.5 + if merchant_category in high_risk_merchants: fraud_score += 0.3 + if is_high_risk_user: fraud_score += 0.2 + + # Compare the fraud score + is_fraud = random.random() < min(fraud_score * 0.3, 0.8) + + # Generate timestamps (some fraud happens at unusual hours) + base_time = datetime.now(timezone.utc) + if is_fraud and random.random() < 0.4: # 40% of fraud at night + hour = random.randint(0, 5) # Late night/early morning + transaction_time = base_time.replace(hour=hour) + else: + transaction_time = base_time - timedelta( + hours=random.randint(0, 168) # Last week + ) + + return { + "transaction_id": str(uuid.uuid4()), + "user_id": user_id, + "amount": amount, + "transaction_timestamp": transaction_time.isoformat(), + "location": location, + "merchant_category": merchant_category, + "is_fraud": "TRUE" if is_fraud else "FALSE", + "ingestion_timestamp": datetime.now(timezone.utc).isoformat() + } + +def send_batch_to_stream(events, batch_size=100): + """Send events to Cloudflare Stream in batches""" + + headers = { + "Authorization": f"Bearer {API_TOKEN}", + "Content-Type": "application/json" + } + + total_sent = 0 + fraud_count = 0 + + for i in range(0, len(events), batch_size): + batch = events[i:i + batch_size] + fraud_in_batch = sum(1 for event in batch if event["is_fraud"] == "TRUE") + + try: + response = requests.post(STREAM_ENDPOINT, headers=headers, json=batch) + + if response.status_code in [200, 201]: + total_sent += len(batch) + fraud_count += fraud_in_batch + print(f"✅ Sent batch of {len(batch)} events (Total: {total_sent})") + else: + print(f"❌ 
Failed to send batch: {response.status_code} - {response.text}") + + except Exception as e: + print(f"❌ Error sending batch: {e}") + + # Small delay between batches + time.sleep(0.1) + + return total_sent, fraud_count + +def main(): + print("Generating fraud detection data...") + + # Generate events + events = [] + for i in range(EVENTS_TO_SEND): + events.append(generate_transaction()) + if (i + 1) % 100 == 0: + print(f"Generated {i + 1} events...") + + fraud_events = sum(1 for event in events if event["is_fraud"] == "TRUE") + print(f"📊 Generated {len(events)} total events ({fraud_events} fraud, {fraud_events/len(events)*100:.1f}%)") + + # Send to stream + print("📤 Sending data to Cloudflare Stream...") + sent, fraud_sent = send_batch_to_stream(events) + + print(f"\n🎉 Complete!") + print(f" Events sent: {sent:,}") + print(f" Fraud events: {fraud_sent:,} ({fraud_sent/sent*100:.1f}%)") + print(f" Data is now flowing through your pipeline!") + +if __name__ == "__main__": + main() +``` + +Update the configuration variables in the script: +- Replace `YOUR_STREAM_ID` with your actual stream endpoint from step 4 +- Replace `YOUR_API_TOKEN` with your Cloudflare API token + +Install the required Python dependency and run the script: + +```bash +pip install requests +python fraud_data_generator.py +``` + +## 6. Query your fraud data with R2 SQL + +Now you can analyze your fraud detection data using R2 SQL. Here are some example queries: + +### View recent transactions + +```bash +npx wrangler r2 sql query "YOUR_WAREHOUSE" " +SELECT + transaction_id, + user_id, + amount, + location, + merchant_category, + is_fraud, + transaction_timestamp +FROM fraud_detection.transactions +WHERE __ingest_ts > '2025-09-12T01:00:00Z' +AND is_fruad = 'TRUE' +LIMIT 10" +``` +:::note +Replace `YOUR_WAREHOUSE` with your R2 Data Catalog warehouse. This in the form of `{YOUR_ACCOUNT_ID}_{BUCKET_NAME}`. This can be found in the dash under the settings in your bucket. Adjust the `__ingest_ts` date in the query as needed. +::: + +### Let's filter the raw transactions into a new table to highlight high-value transactions + +Create a new sink that will write the filtered data to a new Apache Iceberg table in R2 Data Catalog: + +```bash +npx wrangler pipelines sink create filtered-fraud-sink \ + --type "r2-data-catalog" \ + --bucket "fraud-detection-data" \ + --roll-interval 30 \ + --namespace "fraud_detection" \ + --table "fraud_transactions" \ + --catalog-token $WRANGLER_R2_SQL_AUTH_TOKEN +``` + +Now you'll create a new SQL query to process data from the original `fraud-transactions` stream and only write flagged transactions that are over the `amount` of 1000. + +```bash +npx wrangler pipelines create fraud-pipeline \ + --sql "INSERT INTO filtered-fraud-sink SELECT * FROM fraud-transactions WHERE is_fraud='TRUE' and amount > 1000" +``` + +:::note +It may take a few minutes for the new Pipeline to fully Initialize and start processing the data. Also keep in mind the 30 second `roll-interval` +::: + +Let's query our table and check the results: +```bash +npx wrangler r2 sql query " +SELECT + transaction_id, + user_id, + amount, + location, + merchant_category, + is_fraud, + transaction_timestamp +FROM fraud_detection.fraud_transactions +WHERE __ingest_ts > '2025-09-12T01:00:00Z' +LIMIT 10" +``` + +## Conclusion + +You have successfully built an end to end data pipeline using Cloudflare's data platform. Through this tutorial, you've learned to: + +1. 
**Use R2 Data Catalog** - Leveraged Apache Iceberg tables for efficient data storage +2. **Set up Cloudflare Pipelines** - Created streams, sinks, and pipelines for data ingestion +3. **Generated sample data** - Created transaction data with basic fraud patterns +4. **Query with R2 SQL** - Performed complex fraud analysis using SQL queries diff --git a/src/content/docs/r2/sql/index.mdx b/src/content/docs/r2/sql/index.mdx new file mode 100644 index 00000000000000..3aeaa93c32873d --- /dev/null +++ b/src/content/docs/r2/sql/index.mdx @@ -0,0 +1,21 @@ +--- +pcx_content_type: navigation +title: R2 SQL +sidebar: + order: 7 + group: + badge: Beta +head: [] +description: Query your R2 Data Catalog tables with R2 SQL. +--- + +## Efficiently Query Apache Iceberg tables in R2 Data Catalog Using R2 SQL. + + +:::note +R2 SQL is in public beta, and any developer with an R2 subscription can start using it. Currently, outside of standard R2 storage and operations, you will not be billed for your use of R2 SQL +::: + +R2 SQL is Cloudflare's serverless, distributed, analytics query engine for querying Apache Iceberg tables stored in [R2 data catalog](https://developers.cloudflare.com/r2/data-catalog/). R2 SQL is designed to efficiently query large amounts of data by automatically utilizing file pruning, Cloudflare's distributed compute, and R2 object storage. + +Query your first table in R2 SQL by following the Get Started guide, learn how to create a data pipeline that takes a stream of events and automatically creates an Apache Iceberg table, making them accessible with R2 SQL. \ No newline at end of file diff --git a/src/content/docs/r2/sql/platform/limitations-best-practices.mdx b/src/content/docs/r2/sql/platform/limitations-best-practices.mdx new file mode 100644 index 00000000000000..da626501f8ff63 --- /dev/null +++ b/src/content/docs/r2/sql/platform/limitations-best-practices.mdx @@ -0,0 +1,212 @@ +--- +title: Limitations and Best Practices +pcx_content_type: concept +tags: + - SQL +sidebar: + order: 5 + +--- + +# R2 SQL Limitations and Best Practices + +## Overview + +R2 SQL is in public beta, limitations and best practices will change over time. + +R2 SQL is designed for querying **partitioned** Apache Iceberg tables in your R2 data catalog. This document outlines the supported features, limitations, and best practices of R2 SQL. + + +## Quick Reference + +| Feature | Supported | Notes | +| :---- | :---- | :---- | +| Basic SELECT | Yes | Columns, \*, aliases | +| SQL Functions | No | No COUNT, AVG, etc. | +| Single table FROM | Yes | With aliasing | +| JOINs | No | No table joins | +| WHERE with time | Yes | Required | +| Array filtering | No | No array type support | +| JSON filtering | No | No nested object queries | +| Simple LIMIT | Yes | 1-10,000 range | +| ORDER BY | Yes | Only on partition key | +| GROUP BY | No | Not supported | + +## Supported SQL Clauses + +R2 SQL supports a limited set of SQL clauses: `SELECT`, `FROM`, `WHERE`, and `LIMIT`. All other SQL clauses are not supported at the moment. New features will release often, keep an eye on this page and the changelog\[LINK TO CHANGE LOG\] for the latest. 
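
To make this concrete, here is a minimal sketch of a query that stays within the supported grammar. The `fraud_detection.transactions` table and its columns are illustrative names taken from the pipeline tutorial, and `__ingest_ts` is assumed to be the table's time-based partition column (the column Pipelines appends automatically):

```sql
-- Single table, simple filters (including one on the time-based partition column),
-- and a bounded LIMIT
SELECT transaction_id, user_id, amount, is_fraud
FROM fraud_detection.transactions
WHERE __ingest_ts > '2025-01-01T00:00:00Z'
  AND amount > 1000
LIMIT 100
```

Each clause, along with what it does and does not support, is covered in the sections below.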
+ +--- + +## SELECT Clause + +### Supported Features + +- **Individual columns**: `SELECT column1, column2` +- **All columns**: `SELECT *` + +### Limitations + +- **No JSON field querying**: Cannot query individual fields from JSON objects +- **No SQL functions**: Functions like `AVG()`, `COUNT()`, `MAX()`, `MIN()`, quantiles are not supported +- **No synthetic data**: Cannot create synthetic columns like `SELECT 1 AS what, "hello" AS greeting` +- **Field aliasing**: `SELECT field AS another_name` + + +### Examples + +```sql +-- Valid +SELECT timestamp, user_id, status +SELECT * + +-- Invalid +SELECT user_id AS uid, timestamp AS ts +SELECT COUNT(*) FROM events +SELECT json_field.property FROM table +SELECT 1 AS synthetic_column +``` + +--- + +## FROM Clause + +### Supported Features + +- **Single table queries**: `SELECT * FROM table_name` + +### Limitations + +- **No multiple tables**: Cannot specify multiple tables in FROM clause +- **No subqueries**: `SELECT ... FROM (SELECT ...)` is not supported +- **No JOINs**: No INNER, LEFT, RIGHT, or FULL JOINs +- **No SQL functions**: Cannot use functions like `read_parquet()` +- **No synthetic tables**: Cannot create tables from values +- **No schema evolution**: Schema cannot be altered (no ALTER TABLE, migrations) +- **Immutable datasets**: No UPDATE or DELETE operations allowed +- **Fully defined schema**: Dynamic or union-type fields are not supported +- **Table aliasing**: `SELECT * FROM table_name AS alias` + +### Examples + +```sql +--Valid +SELECT * FROM http_requests + +--Invalid +SELECT * FROM table1, table2 +SELECT * FROM table1 JOIN table2 ON table1.id = table2.id +SELECT * FROM (SELECT * FROM events WHERE status = 200) +``` + +--- + +## WHERE Clause + +### Supported Features + +- **Time filtering**: Queries should include a time filter +- **Simple type filtering**: Supports `string`, `boolean`, and `number` types +- **Boolean logic**: Supports `AND`, `OR`, `NOT` operators +- **Comparison operators**: `>`, `>=`, `=`, `<`, `<=`, `!=` +- **Grouped conditions**: `WHERE col_a="hello" AND (col_b>5 OR col_c != 3)` +- **Pattern mating:** `WHERE col_a LIKE ‘%hello w%’` +- **NULL Handling:** `WHERE col_a IS NOT NULL` + +### Limitations + +- **No column-to-column comparisons**: Cannot use `WHERE col_a = col_b` +- **No array filtering**: Cannot filter on array types (array\[number\], array\[string\], array\[boolean\]) +- **No JSON/object filtering**: Cannot filter on fields inside nested objects or JSON +- **No SQL functions**: No function calls in WHERE clause +- **No arithmetic operators**: Cannot use `+`, `-`, `*`, `/` in conditions + +### Examples + +```sql +--Valid +SELECT * FROM events WHERE timestamp BETWEEN '2024-01-01' AND '2024-01-02' +SELECT * FROM logs WHERE status = 200 AND user_type = 'premium' +SELECT * FROM requests WHERE (method = 'GET' OR method = 'POST') AND response_time < 1000 + +--Invalid +SELECT * FROM events -- Missing time filter +SELECT * FROM logs WHERE tags[0] = 'error' -- Array filtering +SELECT * FROM requests WHERE metadata.user_id = '123' -- JSON field filtering +SELECT * FROM events WHERE col_a = col_b -- Column comparison +SELECT * FROM logs WHERE response_time + latency > 5000 -- Arithmetic +``` + +--- + +## ORDER BY Clause + +### Supported Features + +- **ASC**: Ascending order (Default) +- **DESC**: Descending order + +### Limitations + +- **Non-partition keys not supported**: `ORDER BY` on columns other than the partition key is not supported + +### Examples + +```sql +SELECT * FROM table_name WHERE ... 
ORDER BY partitionKey +SELECT * FROM table_name WHERE ... ORDER BY partitionKey DESC +SELECT * FROM table_name WHERE ... ORDER BY partitionKey DESC +``` + +--- + +## LIMIT Clause + +### Supported Features + +- **Simple limits**: `LIMIT number` +- **Range**: Minimum 1, maximum 10,000 + +### Limitations + +- **No pagination**: `LIMIT offset, count` syntax not supported +- **No SQL functions**: Cannot use functions to determine limit +- **No arithmetic**: Cannot use expressions like `LIMIT 10 * 50` + +### Examples + +```sql +-- Valid +SELECT * FROM events WHERE ... LIMIT 100 +SELECT * FROM logs WHERE ... LIMIT 10000 + +-- Invalid +SELECT * FROM events LIMIT 100, 50 -- Pagination +SELECT * FROM logs LIMIT COUNT(*) / 2 -- Functions +SELECT * FROM events LIMIT 10 * 10 -- Arithmetic +``` + +--- + +## Unsupported SQL Clauses + +The following SQL clauses are **not supported**: + +- `GROUP BY` +- `HAVING` +- `UNION`/`INTERSECT`/`EXCEPT` +- `WITH` (Common Table Expressions) +- `WINDOW` functions +- `INSERT`/`UPDATE`/`DELETE` +- `CREATE`/`ALTER`/`DROP` + +--- + +## Best Practices + +1. **Always include time filters** in your WHERE clause to ensure efficient queries +2. **Use specific column selection** instead of `SELECT *` when possible for better performance +3. **Structure your data** to avoid nested JSON objects if you need to filter on those fields + +--- + diff --git a/src/content/docs/r2/sql/platform/pricing.mdx b/src/content/docs/r2/sql/platform/pricing.mdx new file mode 100644 index 00000000000000..e69de29bb2d1d6 diff --git a/src/content/docs/r2/sql/platform/sql-reference.mdx b/src/content/docs/r2/sql/platform/sql-reference.mdx new file mode 100644 index 00000000000000..d020aac3b378d4 --- /dev/null +++ b/src/content/docs/r2/sql/platform/sql-reference.mdx @@ -0,0 +1,251 @@ +--- +title: SQL Reference +pcx_content_type: concept +tags: + - SQL +sidebar: + order: 5 +--- + +# R2 SQL Language Reference + +## Overview + +R2 SQL is in public beta, supported SQL grammar will change over time. + +This reference documents the R2 SQL syntax based on the currently supported grammar in public beta. + +--- + +## Complete Query Syntax + +```sql +SELECT column_list +FROM table_name +WHERE conditions +[ORDER BY column_name [DESC, ASC]] +[LIMIT number] +``` + +--- + +## SELECT Clause + +### Syntax + +```sql +SELECT column_specification [, column_specification, ...] +``` + +### Column Specification + +- **Column name**: `column_name` +- **All columns**: `*` + +### Examples + +```sql +SELECT * FROM table_name +SELECT user_id FROM table_name +SELECT user_id, timestamp, status FROM table_name +SELECT timestamp, user_id, response_code FROM table_name +``` + +--- + +## FROM Clause + +### Syntax + +```sql +SELECT * FROM table_name +``` + +### Examples + +```sql +SELECT column_name FROM table_name +``` + +--- + +## WHERE Clause + +### Syntax + +```sql +SELECT * WHERE condition [AND|OR condition ...] 
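-- Note: a complete query still requires a FROM clause, i.e.
-- SELECT column_list FROM table_name WHERE condition [AND|OR condition ...]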
+``` + +### Conditions + +#### Null Checks + +- `column_name IS NULL` +- `column_name IS NOT NULL` + +#### Value Comparisons + +- `column_name BETWEEN value AND value` +- `column_name = value` +- `column_name >= value` +- `column_name > value` +- `column_name <= value` +- `column_name < value` +- `column_name != value` + +#### Logical Operators + +- `AND` \- Logical AND +- `OR` \- Logical OR + +### Data Types + +- **integer** \- Whole numbers +- **float** \- Decimal numbers +- **string** \- Text values (quoted) + +### Examples + +```sql +SELECT * FROM table_name WHERE timestamp BETWEEN '2025-01-01' AND '2025-01-02' +SELECT * FROM table_name WHERE status = 200 +SELECT * FROM table_name WHERE response_time > 1000 +SELECT * FROM table_name WHERE user_id IS NOT NULL +SELECT * FROM table_name WHERE method = 'GET' AND status >= 200 AND status < 300 +SELECT * FROM table_name WHERE (status = 404 OR status = 500) AND timestamp > '2024-01-01' +``` + +--- + +## ORDER BY Clause + +### Syntax + +```sql +--Note: ORDERY BY only supports ordering by the partition key +ORDER BY partition_key [DESC] +``` + +- **Default**: Ascending order (ASC) +- **DESC**: Descending order + +### Examples + +```sql +SELECT * FROM table_name WHERE ... ORDER BY partitionKey +SELECT * FROM table_name WHERE ... ORDER BY partitionKey DESC +SELECT * FROM table_name WHERE ... ORDER BY partitionKey DESC + +``` + +--- + +## LIMIT Clause + +### Syntax + +```sql +LIMIT number +``` + +- **Range**: 1 to 10,000 +- **Type**: Integer only + +### Examples + +```sql +SELECT * FROM table_name WHERE ... LIMIT 100 +``` + +--- + +## Complete Query Examples + +### Basic Query + +```sql +SELECT * +FROM http_requests +WHERE timestamp BETWEEN '2024-01-01' AND '2024-01-02' +LIMIT 100 +``` + +### Filtered Query with Sorting + +```sql +SELECT user_id, timestamp, status, response_time +FROM access_logs +WHERE status >= 400 AND response_time > 5000 +ORDER BY response_time DESC +LIMIT 50 +``` + +### Complex Conditions + +```sql +SELECT timestamp, method, status, user_agent +FROM http_requests +WHERE (method = 'POST' OR method = 'PUT') + AND status BETWEEN 200 AND 299 + AND user_agent IS NOT NULL +ORDER BY timestamp DESC +LIMIT 1000 +``` + +### Null Handling + +```sql +SELECT user_id, session_id, timestamp +FROM user_events +WHERE session_id IS NOT NULL + AND timestamp >= '2024-01-01' +ORDER BY timestamp +LIMIT 500 +``` + +--- + +## Data Type Reference + +### Supported Types + +| Type | Description | Example Values | +| :---- | :---- | :---- | +| `integer` | Whole numbers | `1`, `42`, `-10`, `0` | +| `float` | Decimal numbers | `1.5`, `3.14`, `-2.7`, `0.0` | +| `string` | Text values | `'hello'`, `'GET'`, `'2024-01-01'` | + +### Type Usage in Conditions + +```sql +-- Integer comparisons +SELECT * FROM table_name WHERE status = 200 +SELECT * FROM table_name WHERE response_time > 1000 + +-- Float comparisons +SELECT * FROM table_name WHERE cpu_usage >= 85.5 +SELECT * FROM table_name WHERE memory_ratio < 0.8 + +-- String comparisons +SELECT * FROM table_name WHERE method = 'POST' +SELECT * FROM table_name WHERE user_agent != 'bot' +SELECT * FROM table_name WHERE country_code = 'US' +``` + +--- + +## Operator Precedence + +1. **Comparison operators**: `=`, `!=`, `<`, `<=`, `>`, `>=`, `BETWEEN`, `IS NULL`, `IS NOT NULL` +2. **AND** (higher precedence) +3. 
**OR** (lower precedence) + +Use parentheses to override default precedence: + +```sql +SELECT * FROM table_name WHERE (status = 404 OR status = 500) AND method = 'GET' +``` + +--- + diff --git a/src/content/docs/r2/sql/troubleshooting.mdx b/src/content/docs/r2/sql/troubleshooting.mdx new file mode 100644 index 00000000000000..5f1a6542cc1819 --- /dev/null +++ b/src/content/docs/r2/sql/troubleshooting.mdx @@ -0,0 +1,308 @@ +--- +title: "R2 SQL Troubleshooting Guide" +pcx_content_type: concept +tags: + - SQL +sidebar: + order: 5 +--- + +# R2 SQL Troubleshooting Guide + +This guide covers potential errors and limitations you may encounter when using R2 SQL. R2 SQL is in open beta and supported functionality will evolve and change over time. + +## Query Structure Errors + +### Missing Required Clauses + +

**Error**: ``expected exactly 1 table in `FROM` clause``

**Problem**: Every R2 SQL query must include a `FROM` clause that names exactly one table.

```sql
-- Invalid - Missing FROM clause
SELECT user_id WHERE status = 200

-- Valid
SELECT user_id
FROM http_requests
WHERE status = 200 AND timestamp BETWEEN '2024-01-01' AND '2024-01-02'
```

**Solution**: Always include `FROM` in your queries.

---

## SELECT Clause Issues

### Unsupported SQL Functions
+**Error**: `Function not supported` +
+ +**Problem**: Trying to use aggregate or SQL functions in SELECT. + +```sql +-- Invalid - Aggregate functions not supported +SELECT COUNT(*) FROM events WHERE timestamp > '2024-01-01' +SELECT AVG(response_time) FROM http_requests WHERE status = 200 +SELECT MAX(timestamp) FROM logs WHERE user_id = '123' +``` + +**Solution**: Use basic column selection and handle aggregation in your application code. + +### JSON Field Access + +
+**Error**: `Cannot access nested fields` +
+ +**Problem**: Attempting to query individual fields from JSON objects. + +```sql +-- Invalid - JSON field access not supported +SELECT metadata.user_id FROM events +SELECT json_field->>'property' FROM logs + +-- Valid - Select entire JSON field +SELECT metadata FROM events +SELECT json_field FROM logs +``` + +**Solution**: Select the entire JSON column and parse it in your application. + +### Synthetic Data + +

**Error**: ``aliases (`AS`) are not supported``
+ +**Problem**: Creating synthetic columns with literal values. + +```sql +-- Invalid - Synthetic data not supported +SELECT user_id, 'active' as status, 1 as priority FROM users + +-- Valid +SELECT user_id, status, priority FROM users WHERE status = 'active' +``` + +**Solution**: Add the required data to your table schema or handle it in post-processing. + +--- + +## FROM Clause Issues + +### Multiple Tables + +
+**Error**: `Multiple tables not supported` or `JOIN operations not allowed` +
+ +**Problem**: Attempting to query multiple tables or use JOINs. + +```sql +-- Invalid - Multiple tables not supported +SELECT a.*, b.* FROM table1 a, table2 b WHERE a.id = b.id +SELECT * FROM events JOIN users ON events.user_id = users.id + +-- Valid - Separate queries +SELECT * FROM table1 WHERE id IN ('id1', 'id2', 'id3') +-- Then in application code, query table2 separately +SELECT * FROM table2 WHERE id IN ('id1', 'id2', 'id3') +``` + +**Solution**: +- Denormalize your data by including necessary fields in a single table +- Perform multiple queries and join data in your application +- Restructure your data model to avoid cross-table queries + +### Subqueries + +

**Error**: ``only table name is supported in `FROM` clause``
+ +**Problem**: Using subqueries in FROM clause. + +```sql +-- Invalid - Subqueries not supported +SELECT * FROM (SELECT user_id FROM events WHERE status = 200) as active_users + +-- Valid - Use direct query with appropriate filters +SELECT user_id FROM events WHERE status = 200 +``` + +**Solution**: Flatten your query logic or use multiple sequential queries. + +--- + +## WHERE Clause Issues + +### Array Filtering + +
+**Error**: `This feature is not implemented: GetFieldAccess` +
+ +**Problem**: Attempting to filter on array fields. + +```sql +-- Invalid - Array filtering not supported +SELECT * FROM logs WHERE tags[0] = 'error' +SELECT * FROM events WHERE 'admin' = ANY(roles) + +-- Valid alternatives - denormalize or use string contains +SELECT * FROM logs WHERE tags_string LIKE '%error%' +-- Or restructure data to avoid arrays +``` + +**Solution**: +- Denormalize array data into separate columns +- Use string concatenation of array values for pattern matching +- Restructure your schema to avoid array types + +### JSON Object Filtering + +
+**Error**: `unsupported binary operator` or `Error during planning: could not parse compound` +
+ +**Problem**: Filtering on fields inside JSON objects. + +```sql +-- Invalid - JSON field filtering not supported +SELECT * FROM requests WHERE metadata.country = 'US' +SELECT * FROM logs WHERE json_data->>'level' = 'error' + +-- Valid alternatives +SELECT * FROM requests WHERE country = 'US' -- If denormalized +-- Or filter entire JSON field and parse in application +SELECT * FROM logs WHERE json_data IS NOT NULL +``` + +**Solution**: +- Denormalize frequently queried JSON fields into separate columns +- Filter on the entire JSON field and handle parsing in your application + +### Column Comparisons + +
+**Error**: `right argument to a binary expression must be a literal` +
+ +**Problem**: Comparing one column to another in WHERE clause. + +```sql +-- Invalid - Column comparisons not supported +SELECT * FROM events WHERE start_time < end_time +SELECT * FROM logs WHERE request_size > response_size + +-- Valid - Use computed columns or application logic +-- Add a computed column 'duration' to your schema +SELECT * FROM events WHERE duration > 0 +``` + +**Solution**: +- Pre-compute comparisons and store as separate columns +- Handle comparisons in your application layer +- Restructure your data model + +--- + +## LIMIT Clause Issues + +### Invalid Limit Values + +
+**Error**: `maximum LIMIT is 10000` +
+ +**Problem**: Using invalid LIMIT values. + +```sql +-- Invalid - Out of range limits +SELECT * FROM events LIMIT 50000 -- Maximum is 10,000 + +-- Valid +SELECT * FROM events LIMIT 1 +SELECT * FROM events LIMIT 10000 +``` + +**Solution**: Use LIMIT values between 1 and 10,000. + +### Pagination Attempts + +
+**Error**: `OFFSET not supported` +
+ +**Problem**: Attempting to use pagination syntax. + +```sql +-- Invalid - Pagination not supported +SELECT * FROM events LIMIT 100 OFFSET 200 +SELECT * FROM events LIMIT 100, 100 + +-- Valid alternatives - Use ORDER BY with conditional filters +-- Page 1 +SELECT * FROM events WHERE timestamp >= '2024-01-01' ORDER BY timestamp LIMIT 100 + +-- Page 2 - Use last timestamp from previous page +SELECT * FROM events WHERE timestamp > '2024-01-01T10:30:00Z' ORDER BY timestamp LIMIT 100 +``` + +**Solution**: Implement cursor-based pagination using ORDER BY and WHERE conditions. + +--- + +## Schema Issues + +### Dynamic Schema Changes + +

**Error**: `invalid SQL: only top-level SELECT clause is supported`
+ +**Problem**: Attempting to modify table schema or reference non-existent columns. + +```sql +-- Invalid - Schema changes not supported +ALTER TABLE events ADD COLUMN new_field STRING +UPDATE events SET status = 200 WHERE user_id = '123' +``` + +**Solution**: +- Plan your schema carefully before data ingestion +- Contact your data engineering team for schema changes +- Ensure all column names exist in your current schema + +--- + +## Performance Optimization + +### Query Performance Issues + +If your queries are running slowly: + +1. **Always include partition (timestamp) filters**: This is the most important optimization + ```sql + -- Good + WHERE timestamp BETWEEN '2024-01-01' AND '2024-01-02' + ``` + +2. **Use selective filtering**: Include specific conditions to reduce result sets + ```sql + -- Good + WHERE status = 200 AND country = 'US' AND timestamp > '2024-01-01' + ``` + +3. **Limit result size**: Use appropriate LIMIT values + ```sql + -- Good for exploration + SELECT * FROM events WHERE timestamp > '2024-01-01' LIMIT 100 + ``` + From 1cbebacf464c99431a9d3dcb98fabd49c1e005ba Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Thu, 18 Sep 2025 15:28:16 -0700 Subject: [PATCH 02/30] fixed link in index --- src/content/docs/r2/sql/index.mdx | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/content/docs/r2/sql/index.mdx b/src/content/docs/r2/sql/index.mdx index 3aeaa93c32873d..d37f584fdf50e8 100644 --- a/src/content/docs/r2/sql/index.mdx +++ b/src/content/docs/r2/sql/index.mdx @@ -18,4 +18,4 @@ R2 SQL is in public beta, and any developer with an R2 subscription can start us R2 SQL is Cloudflare's serverless, distributed, analytics query engine for querying Apache Iceberg tables stored in [R2 data catalog](https://developers.cloudflare.com/r2/data-catalog/). R2 SQL is designed to efficiently query large amounts of data by automatically utilizing file pruning, Cloudflare's distributed compute, and R2 object storage. -Query your first table in R2 SQL by following the Get Started guide, learn how to create a data pipeline that takes a stream of events and automatically creates an Apache Iceberg table, making them accessible with R2 SQL. \ No newline at end of file +Create an end to end data pipeline and query your first table in R2 SQL by following [this step by step guide](/r2/sql/end-to-end-pipeline/), learn how to create a data pipeline that takes a stream of events and automatically creates an Apache Iceberg table, making them accessible with R2 SQL. \ No newline at end of file From dd0e8d5237a1dc543ea36042b3305187f753ed11 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Fri, 19 Sep 2025 09:12:49 -0700 Subject: [PATCH 03/30] fix indents in index, add query-data --- src/content/docs/r2/sql/index.mdx | 8 ++++---- src/content/docs/r2/sql/query-data.mdx | 0 2 files changed, 4 insertions(+), 4 deletions(-) create mode 100644 src/content/docs/r2/sql/query-data.mdx diff --git a/src/content/docs/r2/sql/index.mdx b/src/content/docs/r2/sql/index.mdx index d37f584fdf50e8..a97dd2bfbd417b 100644 --- a/src/content/docs/r2/sql/index.mdx +++ b/src/content/docs/r2/sql/index.mdx @@ -2,11 +2,11 @@ pcx_content_type: navigation title: R2 SQL sidebar: - order: 7 - group: - badge: Beta + order: 7 + group: + badge: Beta head: [] -description: Query your R2 Data Catalog tables with R2 SQL. +description: A distributed SQL engine for R2 Data Catalog --- ## Efficiently Query Apache Iceberg tables in R2 Data Catalog Using R2 SQL. 
diff --git a/src/content/docs/r2/sql/query-data.mdx b/src/content/docs/r2/sql/query-data.mdx new file mode 100644 index 00000000000000..e69de29bb2d1d6 From 87e5a32f31faa0b0e5738c92cefaeb065a77f063 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Fri, 19 Sep 2025 10:49:34 -0700 Subject: [PATCH 04/30] Improved all docs, added index.mdx in platform also tested examples e2e --- .../docs/r2/sql/end-to-end-pipeline.mdx | 142 +++++++++++++----- src/content/docs/r2/sql/platform/index.mdx | 7 + src/content/docs/r2/sql/platform/pricing.mdx | 17 +++ src/content/docs/r2/sql/query-data.mdx | 77 ++++++++++ src/content/docs/r2/sql/troubleshooting.mdx | 7 +- 5 files changed, 206 insertions(+), 44 deletions(-) create mode 100644 src/content/docs/r2/sql/platform/index.mdx diff --git a/src/content/docs/r2/sql/end-to-end-pipeline.mdx b/src/content/docs/r2/sql/end-to-end-pipeline.mdx index 455d5ed5fd0a36..b9a7b65d8a0c9e 100644 --- a/src/content/docs/r2/sql/end-to-end-pipeline.mdx +++ b/src/content/docs/r2/sql/end-to-end-pipeline.mdx @@ -1,10 +1,10 @@ --- -title: Build a fraud detection pipeline with Cloudflare Pipelines and R2 SQL +title: Build an end to end data pipeline summary: Learn how to create an end-to-end data pipeline using Cloudflare Pipelines, R2 Data Catalog, and R2 SQL for real-time transaction analysis. pcx_content_type: tutorial products: - R2 - - R2 Data Catalog + - R2 Data Catalog - R2 SQL --- @@ -83,11 +83,9 @@ npx wrangler r2 bucket catalog compaction enable fraud-detection-data --token $W ### Create the Pipeline stream -Create a stream to receive incoming fraud detection events: - -```bash -npx wrangler pipelines streams create fraud-transactions \ - --schema '{ +First, create a schema file called `raw_transactions_schema.json` with the following `json` schema: +```json +{ "fields": [ {"name": "transaction_id", "type": "string", "required": true}, {"name": "user_id", "type": "int64", "required": true}, @@ -98,20 +96,70 @@ npx wrangler pipelines streams create fraud-transactions \ {"name": "is_fraud", "type": "string", "required": false}, {"name": "ingestion_timestamp", "type": "string", "required": false} ] - }' \ +} +``` + +Create a stream to receive incoming fraud detection events: + +```bash +npx wrangler pipelines streams create rawtransactionstream \ + --schema-file raw_transactions_schema.json \ --http-enabled true \ --http-auth true ``` :::note -After running the `stream create` command, note the **Stream Endpoint URL** from the output. This is the endpoint you'll use to send data to your pipeline. +Note the **HTTP Ingest Endpoint URL** from the output. This is the endpoint you'll use to send data to your pipeline. ::: +```bash +# The http ingest endpoint from the output (see example below) +export STREAM_ENDPOINT= #the http ingest endpoint from the output (see example below) +``` + +The output should look like this: +```sh +🌀 Creating stream 'rawtransactionstream'... +✨ Successfully created stream 'rawtransactionstream' with id 'stream_id'. 
+ +Creation Summary: +General: + Name: rawtransactionstream + +HTTP Ingest: + Enabled: Yes + Authentication: Yes + Endpoint: https://stream_id.ingest.cloudflare.com + CORS Origins: None + +Input Schema: +┌───────────────────────┬────────┬────────────┬──────────┐ +│ Field Name │ Type │ Unit/Items │ Required │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ transaction_id │ string │ │ Yes │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ user_id │ int64 │ │ Yes │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ amount │ f64 │ │ No │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ transaction_timestamp │ string │ │ No │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ location │ string │ │ No │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ merchant_category │ string │ │ No │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ is_fraud │ string │ │ No │ +├───────────────────────┼────────┼────────────┼──────────┤ +│ ingestion_timestamp │ string │ │ No │ +└───────────────────────┴────────┴────────────┴──────────┘ +``` + + ### Create the data sink Create a sink that writes data to your R2 bucket as Apache Iceberg tables: ```bash -npx wrangler pipelines sinks create fraud-data-sink \ +npx wrangler pipelines sinks create rawtransactionsink \ --type "r2-data-catalog" \ --bucket "fraud-detection-data" \ --roll-interval 30 \ @@ -129,8 +177,8 @@ This creates a `sink` configuration that will write to the Iceberg table fraud_d Connect your stream to your sink with SQL: ```bash -npx wrangler pipelines create fraud-pipeline \ - --sql "INSERT INTO fraud-data-sink SELECT * FROM fraud-transactions" +npx wrangler pipelines create transactionspipeline \ + --sql "INSERT INTO rawtransactionsink SELECT * FROM rawtransactionstream" ``` ## 5. 
Generate fraud detection data @@ -143,15 +191,16 @@ import json import uuid import random import time +import os from datetime import datetime, timezone, timedelta -# Configuration -STREAM_ENDPOINT = "https://YOUR_STREAM_ID.ingest.cloudflare.com" # From the stream you created -API_TOKEN = "WRANGLER_R2_SQL_AUTH_TOKEN" #the same one created earlier +# Configuration - exported from the prior steps +STREAM_ENDPOINT = os.environ["STREAM_ENDPOINT"]# From the stream you created +API_TOKEN = os.environ["WRANGLER_R2_SQL_AUTH_TOKEN"] #the same one created earlier EVENTS_TO_SEND = 1000 # Feel free to adjust this def generate_transaction(): - """Generate some transactions with occassional fraud patterns""" + """Generate some random transactions with occassional fraud""" # User IDs high_risk_users = [1001, 1002, 1003, 1004, 1005] @@ -160,7 +209,7 @@ def generate_transaction(): user_id = random.choice(high_risk_users + normal_users) is_high_risk_user = user_id in high_risk_users - # Generate amount + # Generate amounts if random.random() < 0.05: amount = round(random.uniform(5000, 50000), 2) elif random.random() < 0.03: @@ -169,8 +218,8 @@ def generate_transaction(): amount = round(random.uniform(10, 500), 2) # Locations - normal_locations = ["NEW_YORK", "LOS_ANGELES", "CHICAGO", "MIAMI", "SEATTLE"] - high_risk_locations = ["UNKNOWN_LOCATION", "VPN_EXIT", "BELARUS", "NIGERIA"] + normal_locations = ["NEW_YORK", "LOS_ANGELES", "CHICAGO", "MIAMI", "SEATTLE", "SAN FRANCISCO"] + high_risk_locations = ["UNKNOWN_LOCATION", "VPN_EXIT", "MARS", "BAT_CAVE"] if is_high_risk_user and random.random() < 0.3: location = random.choice(high_risk_locations) @@ -186,7 +235,7 @@ def generate_transaction(): else: merchant_category = random.choice(normal_merchants) - # Determine if transaction is fraudulent based on basic risk factors + # Series of checks to either increase fraud score by a certain margin fraud_score = 0 if amount > 2000: fraud_score += 0.4 if amount < 1: fraud_score += 0.3 @@ -194,7 +243,7 @@ def generate_transaction(): if merchant_category in high_risk_merchants: fraud_score += 0.3 if is_high_risk_user: fraud_score += 0.2 - # Compare the fraud score + # Compare the fraud scores is_fraud = random.random() < min(fraud_score * 0.3, 0.8) # Generate timestamps (some fraud happens at unusual hours) @@ -239,14 +288,13 @@ def send_batch_to_stream(events, batch_size=100): if response.status_code in [200, 201]: total_sent += len(batch) fraud_count += fraud_in_batch - print(f"✅ Sent batch of {len(batch)} events (Total: {total_sent})") + print(f"Sent batch of {len(batch)} events (Total: {total_sent})") else: - print(f"❌ Failed to send batch: {response.status_code} - {response.text}") + print(f"Failed to send batch: {response.status_code} - {response.text}") except Exception as e: - print(f"❌ Error sending batch: {e}") + print(f"Error sending batch: {e}") - # Small delay between batches time.sleep(0.1) return total_sent, fraud_count @@ -265,10 +313,10 @@ def main(): print(f"📊 Generated {len(events)} total events ({fraud_events} fraud, {fraud_events/len(events)*100:.1f}%)") # Send to stream - print("📤 Sending data to Cloudflare Stream...") + print("Sending data to Pipeline stream...") sent, fraud_sent = send_batch_to_stream(events) - print(f"\n🎉 Complete!") + print(f"\nComplete!") print(f" Events sent: {sent:,}") print(f" Fraud events: {fraud_sent:,} ({fraud_sent/sent*100:.1f}%)") print(f" Data is now flowing through your pipeline!") @@ -305,8 +353,8 @@ SELECT is_fraud, transaction_timestamp FROM 
fraud_detection.transactions -WHERE __ingest_ts > '2025-09-12T01:00:00Z' -AND is_fruad = 'TRUE' +WHERE __ingest_ts > '2025-09-24T01:00:00Z' +AND is_fraud = 'TRUE' LIMIT 10" ``` :::note @@ -318,7 +366,7 @@ Replace `YOUR_WAREHOUSE` with your R2 Data Catalog warehouse. This in the form o Create a new sink that will write the filtered data to a new Apache Iceberg table in R2 Data Catalog: ```bash -npx wrangler pipelines sink create filtered-fraud-sink \ +npx wrangler pipelines sinks create filteredfraudsink \ --type "r2-data-catalog" \ --bucket "fraud-detection-data" \ --roll-interval 30 \ @@ -327,20 +375,20 @@ npx wrangler pipelines sink create filtered-fraud-sink \ --catalog-token $WRANGLER_R2_SQL_AUTH_TOKEN ``` -Now you'll create a new SQL query to process data from the original `fraud-transactions` stream and only write flagged transactions that are over the `amount` of 1000. +Now you'll create a new SQL query to process data from the original `rawtransactionstream` stream and only write flagged transactions that are over the `amount` of 1000. ```bash -npx wrangler pipelines create fraud-pipeline \ - --sql "INSERT INTO filtered-fraud-sink SELECT * FROM fraud-transactions WHERE is_fraud='TRUE' and amount > 1000" +npx wrangler pipelines create fraudpipeline \ + --sql "INSERT INTO filteredfraudsink SELECT * FROM rawtransactionstream WHERE is_fraud='TRUE' and amount > 1000" ``` :::note It may take a few minutes for the new Pipeline to fully Initialize and start processing the data. Also keep in mind the 30 second `roll-interval` ::: -Let's query our table and check the results: +Let's query the table and check the results: ```bash -npx wrangler r2 sql query " +npx wrangler r2 sql query "YOUR_WAREHOUSE" " SELECT transaction_id, user_id, @@ -350,9 +398,27 @@ SELECT is_fraud, transaction_timestamp FROM fraud_detection.fraud_transactions -WHERE __ingest_ts > '2025-09-12T01:00:00Z' LIMIT 10" ``` +Let's also verify that the non-fraudulent events are being filtered out: +```bash +npx wrangler r2 sql query "YOUR_WAREHOUSE" " +SELECT + transaction_id, + user_id, + amount, + location, + merchant_category, + is_fraud, + transaction_timestamp +FROM fraud_detection.fraud_transactions +WHERE is_fraud = 'FALSE' +LIMIT 10" +``` +You should see the following output: +```text +Query executed successfully with no results +``` ## Conclusion @@ -360,5 +426,5 @@ You have successfully built an end to end data pipeline using Cloudflare's data 1. **Use R2 Data Catalog** - Leveraged Apache Iceberg tables for efficient data storage 2. **Set up Cloudflare Pipelines** - Created streams, sinks, and pipelines for data ingestion -3. **Generated sample data** - Created transaction data with basic fraud patterns -4. **Query with R2 SQL** - Performed complex fraud analysis using SQL queries +3. **Generated sample data** - Created transaction data with some basic fraud patterns +4. 
**Query your tables with R2 SQL** - Access raw and processed data tables stored in R2 Data Catalog diff --git a/src/content/docs/r2/sql/platform/index.mdx b/src/content/docs/r2/sql/platform/index.mdx new file mode 100644 index 00000000000000..ef43ff93fe3c19 --- /dev/null +++ b/src/content/docs/r2/sql/platform/index.mdx @@ -0,0 +1,7 @@ +--- +title: Platform +pcx_content_type: navigation +sidebar: + group: + hideIndex: true +--- diff --git a/src/content/docs/r2/sql/platform/pricing.mdx b/src/content/docs/r2/sql/platform/pricing.mdx index e69de29bb2d1d6..2b41cd9c6df209 100644 --- a/src/content/docs/r2/sql/platform/pricing.mdx +++ b/src/content/docs/r2/sql/platform/pricing.mdx @@ -0,0 +1,17 @@ +--- +pcx_content_type: concept +title: Pricing +sidebar: + order: 1 +head: + - tag: title + content: R2 SQL - Pricing + +--- + + +R2 SQL is currently not billed during open beta but will eventually be billed on the amount of data queried. + +During the first phase of the R2 SQL open beta, you will not be billed for R2 SQL usage. You will be billed only for R2 usage. + +We plan to price based on the volume of data queried by R2 SQL. We will provide at least 30 days' notice and exact pricing before charging. \ No newline at end of file diff --git a/src/content/docs/r2/sql/query-data.mdx b/src/content/docs/r2/sql/query-data.mdx index e69de29bb2d1d6..3905eb47b20380 100644 --- a/src/content/docs/r2/sql/query-data.mdx +++ b/src/content/docs/r2/sql/query-data.mdx @@ -0,0 +1,77 @@ +--- +title: Query data in R2 Data Catalog +pcx_content_type: example +--- + +:::note +R2 SQL is currently in open beta +::: + +## Prerequisites + +- Sign up for a [Cloudflare account](https://dash.cloudflare.com/sign-up/workers-and-pages). +- [Create an R2 bucket](/r2/buckets/create-buckets/) and [enable the data catalog](/r2/data-catalog/manage-catalogs/#enable-r2-data-catalog-on-a-bucket). +- [Create an R2 API token](/r2/api/tokens/) with [R2, R2 SQL, and data catalog permissions](/r2/api/tokens/#permissions). +- Tables must have a time-based partition key in order be queried by R2 SQL. Read about the current [limitations](/r2/sql/platform/limitations-best-practices) to learn more. + +R2 SQL can currently be accessed via Wrangler commands or a REST API. + +## Wrangler + + +Export your R2 API token as an environment variable: + +```bash +export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here +``` + +If this is your first time using Wrangler, make sure to login. +```bash +npx wrangler login +``` + +You'll also want to grab the **warehouse** of the your R2 Data Catalog: + +```sh +❯ npx wrangler r2 bucket catalog get [BUCKET_NAME] + + ⛅️ wrangler 4.38.0 +──────────────────────────────────────────────────────────────────────────── +▲ [WARNING] 🚧 `wrangler r2 bucket catalog get` is an open-beta command. Please report any issues to https://github.com/cloudflare/workers-sdk/issues/new/choose + + +Catalog URI: https://catalog.cloudflarestorage.com/[ACCOUNT_ID]/[BUCKET_NAME] +Warehouse: [ACCOUNT_ID]_[BUCKET_NAME] +Status: active +``` + +To query R2 SQL with Wrangler, simply run: + +```sh +npx wrangler r2 sql query "YOUR_WAREHOUSE" "SELECT * FROM namespace.table_name limit 10;" +``` +For a full list of supported sql commands, check out the [R2 SQL reference page](/r2/sql/platform/sql-reference). 
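
Queries are most efficient when they filter on the table's time-based partition column. As a sketch, assuming the table was written by Pipelines (which appends an `__ingest_ts` partition column) and using placeholder column names, the SQL you pass to the command above might look like:

```sql
-- Narrow the scan to a recent time window and cap the result size
SELECT transaction_id, user_id, amount
FROM namespace.table_name
WHERE __ingest_ts > '2025-01-01T00:00:00Z'
LIMIT 100;
```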
+ + +## REST API + +Set your environment variable + +```bash +export ACCOUNT_ID="your-cloudflare-account-id" +export BUCKET_NAME="your-r2-bucket-name" +export WRANGLER_R2_SQL_AUTH_TOKEN="your_token_here" +``` + +Now you're ready to use the REST endpoint + +```bash +curl -X POST \ + "https://api.sql.cloudflarestorage.com/api/v1/accounts/${ACCOUNT_ID}/r2-sql/query/${BUCKET_NAME}" \ + -H "Authorization: Bearer ${WRANGLER_R2_SQL_AUTH_TOKEN}" \ + -H "Content-Type: application/json" \ + -d '{ + "warehouse": "your-warehouse-name", + "query": "SELECT * FROM namespace.table_name limit 10;" + }' | jq . +``` \ No newline at end of file diff --git a/src/content/docs/r2/sql/troubleshooting.mdx b/src/content/docs/r2/sql/troubleshooting.mdx index 5f1a6542cc1819..d233ccdaeffa0c 100644 --- a/src/content/docs/r2/sql/troubleshooting.mdx +++ b/src/content/docs/r2/sql/troubleshooting.mdx @@ -118,7 +118,6 @@ SELECT * FROM table2 WHERE id IN ('id1', 'id2', 'id3') **Solution**: - Denormalize your data by including necessary fields in a single table - Perform multiple queries and join data in your application -- Restructure your data model to avoid cross-table queries ### Subqueries @@ -206,10 +205,7 @@ SELECT * FROM logs WHERE request_size > response_size SELECT * FROM events WHERE duration > 0 ``` -**Solution**: -- Pre-compute comparisons and store as separate columns -- Handle comparisons in your application layer -- Restructure your data model +**Solution**: Handle comparisons in your application layer --- @@ -277,7 +273,6 @@ UPDATE events SET status = 200 WHERE user_id = '123' **Solution**: - Plan your schema carefully before data ingestion -- Contact your data engineering team for schema changes - Ensure all column names exist in your current schema --- From b8abf911b2e24ddf2a2edeb85d07a01b522c319a Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Fri, 19 Sep 2025 10:50:54 -0700 Subject: [PATCH 05/30] removed redundant command --- src/content/docs/r2/sql/end-to-end-pipeline.mdx | 4 ---- 1 file changed, 4 deletions(-) diff --git a/src/content/docs/r2/sql/end-to-end-pipeline.mdx b/src/content/docs/r2/sql/end-to-end-pipeline.mdx index b9a7b65d8a0c9e..3e236a1e31f28d 100644 --- a/src/content/docs/r2/sql/end-to-end-pipeline.mdx +++ b/src/content/docs/r2/sql/end-to-end-pipeline.mdx @@ -325,10 +325,6 @@ if __name__ == "__main__": main() ``` -Update the configuration variables in the script: -- Replace `YOUR_STREAM_ID` with your actual stream endpoint from step 4 -- Replace `YOUR_API_TOKEN` with your Cloudflare API token - Install the required Python dependency and run the script: ```bash From 1f9632f0822aedbcbcf6a5f89186a9b7d0e6664b Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Sat, 20 Sep 2025 15:27:52 -0700 Subject: [PATCH 06/30] A ton of changes and improvements implemented Jerome's feedback in virtually all docs. Docs are properly organized now. 
--- .gitignore | 3 +- src/content/docs/r2/sql/get-started.mdx | 210 ++++++++++++++++++ .../platform/limitations-best-practices.mdx | 26 +-- src/content/docs/r2/sql/platform/pricing.mdx | 2 +- .../docs/r2/sql/platform/sql-reference.mdx | 23 +- src/content/docs/r2/sql/query-data.mdx | 7 +- src/content/docs/r2/sql/troubleshooting.mdx | 10 +- .../{ => tutorials}/end-to-end-pipeline.mdx | 76 +++---- src/content/docs/r2/sql/tutorials/index.mdx | 7 + 9 files changed, 292 insertions(+), 72 deletions(-) create mode 100644 src/content/docs/r2/sql/get-started.mdx rename src/content/docs/r2/sql/{ => tutorials}/end-to-end-pipeline.mdx (84%) create mode 100644 src/content/docs/r2/sql/tutorials/index.mdx diff --git a/.gitignore b/.gitignore index 501cf6fc5247c5..673fe364a8a3ec 100644 --- a/.gitignore +++ b/.gitignore @@ -29,4 +29,5 @@ pnpm-debug.log* /assets/secrets /worker/functions/ -.idea \ No newline at end of file +.idea +package-lock.json diff --git a/src/content/docs/r2/sql/get-started.mdx b/src/content/docs/r2/sql/get-started.mdx new file mode 100644 index 00000000000000..cc6773163e5977 --- /dev/null +++ b/src/content/docs/r2/sql/get-started.mdx @@ -0,0 +1,210 @@ +--- +pcx_content_type: get-started +title: Getting started +head: [] +sidebar: + order: 2 +description: Learn how to get up and running with R2 SQL using R2 Data Catalog and Pipelines +--- +import { + Render, + LinkCard, +} from "~/components"; + +## Overview + +This guide will instruct you through: + +- Creating an [R2 bucket](/r2/buckets/) and enabling its [data catalog](/r2/data-catalog/). +- Using Wrangler to create a Pipeline Stream, Sink, and the SQL that reads from the stream and writes it to the sink +- Sending some data to the stream via the HTTP Streams endpoint +- Querying the data using R2 SQL + +## Prerequisites + +1. Sign up for a [Cloudflare account](https://dash.cloudflare.com/sign-up). +2. Install [Node.js](https://nodejs.org/en/). +3. Install [Wrangler](/workers/wranger/install-and-update) + +:::note[Node.js version manager] +Use a Node version manager like [Volta](https://volta.sh/) or [nvm](https://github.com/nvm-sh/nvm) to avoid permission issues and change Node.js versions. Wrangler requires a Node version of 16.17.0 or later. +::: + +## 1. Set up authentication + +You'll need API tokens to interact with Cloudflare services. + +### Custom API Token +1. Go to **My Profile** → **API Tokens** in the Cloudflare dashboard +2. Select **Create Token** → **Custom token** +3. Add the following permissions: + - **Workers Pipelines** - Read, Send, Edit + - **Workers R2 Storage** - Edit, Read + - **Workers R2 Data Catalog** - Edit, Read + - **Workers R2 SQL** - Read + +Export your new token as an environment variable: + +```bash +export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here +``` + +If this is your first time using Wrangler, make sure to login. +```bash +npx wrangler login +``` + +## 2. Create an R2 bucket + +Create a new R2 bucket: + +```bash +npx wrangler r2 bucket create r2-sql-demo +``` + +## 3. Enable R2 Data Catalog + +Enable [R2 Data Catalog](/r2/data-catalog/) feature on your bucket to use Apache Iceberg tables: + +```bash +npx wrangler r2 bucket catalog enable r2-sql-demo +``` +## 4. Create the data Pipeline + +### 1. 
Create the Pipeline Stream + +First, create a schema file called `demo_schema.json` with the following `json` schema: +```json +{ + "fields": [ + {"name": "user_id", "type": "int64", "required": true}, + {"name": "payload", "type": "string", "required": false}, + {"name": "numbers", "type": "int32", "required": false} + ] +} +``` +Next, crete the stream we'll use to ingest events to: + +```bash +npx wrangler pipelines streams create demo_stream \ + --schema-file demo_schema.json \ + --http-enabled true \ + --http-auth false +``` +:::note +Note the **HTTP Ingest Endpoint URL** from the output. This is the endpoint you'll use to send data to your pipeline. +::: + +```bash +# The http ingest endpoint from the output (see example below) +export STREAM_ENDPOINT= #the http ingest endpoint from the output (see example below) +``` +The output should look like this: +```sh +🌀 Creating stream 'demo_stream'... +✨ Successfully created stream 'demo_stream' with id 'stream_id'. + +Creation Summary: +General: + Name: demo_stream + +HTTP Ingest: + Enabled: Yes + Authentication: No + Endpoint: https://stream_id.ingest.cloudflare.com + CORS Origins: None + +Input Schema: +┌────────────┬────────┬────────────┬──────────┐ +│ Field Name │ Type │ Unit/Items │ Required │ +├────────────┼────────┼────────────┼──────────┤ +│ user_id │ int64 │ │ Yes │ +├────────────┼────────┼────────────┼──────────┤ +│ payload │ string │ │ No │ +├────────────┼────────┼────────────┼──────────┤ +│ numbers │ int32 │ │ No │ +└────────────┴────────┴────────────┴──────────┘ +``` + + +### 2. Create the Pipeline Sink + +Create a sink that writes data to your R2 bucket as Apache Iceberg tables: + +```bash +npx wrangler pipelines sinks create demo_sink \ + --type "r2-data-catalog" \ + --bucket "r2-sql-demo" \ + --roll-interval 30 \ + --namespace "demo" \ + --table "first_table" \ + --catalog-token $WRANGLER_R2_SQL_AUTH_TOKEN +``` + +:::note +This creates a `sink` configuration that will write to the Iceberg table demo.first_table in your R2 Data Catalog every 30 seconds. Pipelines automatically appends an `__ingest_ts` column that is used to partition the table by `DAY` +::: + +### 3. Create the Pipeline + +Pipelines are SQL statements read data from the stream, does some work, and writes it to the sink + +```bash +npx wrangler pipelines create demo_pipeline \ + --sql "INSERT INTO demo_sink SELECT * FROM demo_stream WHERE numbers > 5;" +``` +:::note +Note that there is a filter on this statement that will only send events where `numbers` is greater than 5 +::: + +## 5. Send some data + +Next, let's send some events to our stream: + +```curl +curl -X POST "$STREAM_ENDPOINT" \ + -H "Authorization: Bearer YOUR_API_TOKEN" \ + -H "Content-Type: application/json" \ + -d '[ + { + "user_id": 1, + "payload": "you should see this", + "numbers": 42 + }, + { + "user_id": 2, + "payload": "you should also see this", + "numbers": 100 + }, + { + "user_id": 3, + "payload": null, + "numbers": 1 + }, + { + "user_id": 4, + "numbers": null + } + ]' +``` +This will send 4 events in one `POST`. Since our Pipeline is filtering out records with `numbers` less than 5, `user_id` `3` and `4` should not appear in the table. Feel free to change values and send more events. + +## 6. Query the table with R2 SQL + +After you've sent your events to the stream, it will take about 30 seconds for the data to show in the table since that's what we configured our `roll interval` to be in the Sink. 
+ +```bash +npx wrangler r2 sql query "SELECT * FROM demo.first_table LIMIT 10" +``` + + + + diff --git a/src/content/docs/r2/sql/platform/limitations-best-practices.mdx b/src/content/docs/r2/sql/platform/limitations-best-practices.mdx index da626501f8ff63..adb53dfab59804 100644 --- a/src/content/docs/r2/sql/platform/limitations-best-practices.mdx +++ b/src/content/docs/r2/sql/platform/limitations-best-practices.mdx @@ -21,20 +21,20 @@ R2 SQL is designed for querying **partitioned** Apache Iceberg tables in your R2 | Feature | Supported | Notes | | :---- | :---- | :---- | -| Basic SELECT | Yes | Columns, \*, aliases | -| SQL Functions | No | No COUNT, AVG, etc. | -| Single table FROM | Yes | With aliasing | +| Basic SELECT | Yes | Columns, \* | +| Aggregation functions | No | No COUNT, AVG, etc. | +| Single table FROM | Yes | Note, aliasing not supported| +| WHERE clause | Yes | Filters, comparisons, equality, etc | | JOINs | No | No table joins | -| WHERE with time | Yes | Required | | Array filtering | No | No array type support | | JSON filtering | No | No nested object queries | | Simple LIMIT | Yes | 1-10,000 range | -| ORDER BY | Yes | Only on partition key | +| ORDER BY | Yes | Any columns of the partition key only| | GROUP BY | No | Not supported | ## Supported SQL Clauses -R2 SQL supports a limited set of SQL clauses: `SELECT`, `FROM`, `WHERE`, and `LIMIT`. All other SQL clauses are not supported at the moment. New features will release often, keep an eye on this page and the changelog\[LINK TO CHANGE LOG\] for the latest. +R2 SQL supports a limited set of SQL clauses: `SELECT`, `FROM`, `WHERE`, and `LIMIT`. All other SQL clauses are not supported at the moment. New features will be released in the future, keep an eye on this page and the changelog\[LINK TO CHANGE LOG\] for the latest. 
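+
+As a quick illustration, the following query stays entirely within that supported surface (it assumes the sample `fraud_detection.transactions` table from the pipeline tutorial; substitute your own namespace, table, and columns):
+
+```sql
+-- Uses only SELECT, FROM, WHERE, and LIMIT
+SELECT transaction_id, amount, merchant_category
+FROM fraud_detection.transactions
+WHERE __ingest_ts > '2025-09-24T01:00:00Z' AND amount > 1000
+LIMIT 100
+```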
---
@@ -50,7 +50,7 @@ R2 SQL supports a limited set of SQL clauses: `SELECT`, `FROM`, `WHERE`, and `LI

- **No JSON field querying**: Cannot query individual fields from JSON objects
- **No SQL functions**: Functions like `AVG()`, `COUNT()`, `MAX()`, `MIN()`, quantiles are not supported
- **No synthetic data**: Cannot create synthetic columns like `SELECT 1 AS what, "hello" AS greeting`
-- **Field aliasing**: `SELECT field AS another_name`
+- **No field aliasing**: `SELECT field AS another_name`

### Examples

@@ -85,7 +85,7 @@ SELECT 1 AS synthetic_column

- **No schema evolution**: Schema cannot be altered (no ALTER TABLE, migrations)
- **Immutable datasets**: No UPDATE or DELETE operations allowed
- **Fully defined schema**: Dynamic or union-type fields are not supported
-- **Table aliasing**: `SELECT * FROM table_name AS alias`
+- **No table aliasing**: `SELECT * FROM table_name AS alias`

### Examples

@@ -105,13 +105,12 @@ SELECT * FROM (SELECT * FROM events WHERE status = 200)

### Supported Features

-- **Time filtering**: Queries should include a time filter
-- **Simple type filtering**: Supports `string`, `boolean`, and `number` types
+- **Simple type filtering**: Supports `string`, `boolean`, `number` types, and timestamps expressed in RFC3339 format
- **Boolean logic**: Supports `AND`, `OR`, `NOT` operators
- **Comparison operators**: `>`, `>=`, `=`, `<`, `<=`, `!=`
- **Grouped conditions**: `WHERE col_a="hello" AND (col_b>5 OR col_c != 3)`
-- **Pattern mating:** `WHERE col_a LIKE ‘%hello w%’`
-- **NULL Handling:** `WHERE col_a IS NOT NULL`
+- **Pattern matching:** `WHERE col_a LIKE 'hello w%'` (prefix matching only)
+- **NULL handling:** `WHERE col_a IS NOT NULL` (`IS`/`IS NOT`)

### Limitations

@@ -208,5 +207,4 @@ The following SQL clauses are **not supported**:

2. **Use specific column selection** instead of `SELECT *` when possible for better performance
3. **Structure your data** to avoid nested JSON objects if you need to filter on those fields

----
-
+--- \ No newline at end of file
diff --git a/src/content/docs/r2/sql/platform/pricing.mdx b/src/content/docs/r2/sql/platform/pricing.mdx
index 2b41cd9c6df209..b408b2f4192f63 100644
--- a/src/content/docs/r2/sql/platform/pricing.mdx
+++ b/src/content/docs/r2/sql/platform/pricing.mdx
@@ -14,4 +14,4 @@ R2 SQL is currently not billed during open beta but will eventually be billed on

During the first phase of the R2 SQL open beta, you will not be billed for R2 SQL usage. You will be billed only for R2 usage.

-We plan to price based on the volume of data queried by R2 SQL. We will provide at least 30 days' notice and exact pricing before charging. \ No newline at end of file
+We plan to price based on the volume of data queried by R2 SQL. We will provide at least 30 days' notice and exact pricing before charging. \ No newline at end of file
diff --git a/src/content/docs/r2/sql/platform/sql-reference.mdx b/src/content/docs/r2/sql/platform/sql-reference.mdx
index d020aac3b378d4..be24d1660642c8 100644
--- a/src/content/docs/r2/sql/platform/sql-reference.mdx
+++ b/src/content/docs/r2/sql/platform/sql-reference.mdx
@@ -93,6 +93,7 @@ SELECT * WHERE condition [AND|OR condition ...]

- `column_name <= value`
- `column_name < value`
- `column_name != value`
+- `column_name LIKE 'value%'`

#### Logical Operators

@@ -104,11 +105,12 @@
- **integer** \- Whole numbers
- **float** \- Decimal numbers
- **string** \- Text values (quoted)
+- **timestamp** - RFC3339 format (`'YYYY-MM-DDTHH:MM:SSZ'`)

### Examples

```sql
-SELECT * FROM table_name WHERE timestamp BETWEEN '2025-01-01' AND '2025-01-02'
+SELECT * FROM table_name WHERE timestamp BETWEEN '2025-09-24T01:00:00Z' AND '2025-09-25T01:00:00Z'
SELECT * FROM table_name WHERE status = 200
SELECT * FROM table_name WHERE response_time > 1000
SELECT * FROM table_name WHERE user_id IS NOT NULL
@@ -123,19 +125,21 @@ SELECT * FROM table_name WHERE (status = 404 OR status = 500) AND timestamp > '2

### Syntax

```sql
---Note: ORDERY BY only supports ordering by the partition key
+--Note: ORDER BY only supports ordering by the partition key
ORDER BY partition_key [DESC]
```

-- **Default**: Ascending order (ASC)
+- **ASC**: Ascending order
- **DESC**: Descending order
+- **Default**: partition_key DESC
+- Can contain any column from the partition key

### Examples

```sql
-SELECT * FROM table_name WHERE ... ORDER BY partitionKey
-SELECT * FROM table_name WHERE ... ORDER BY partitionKey DESC
-SELECT * FROM table_name WHERE ... ORDER BY partitionKey DESC
+SELECT * FROM table_name WHERE ... ORDER BY partition_key_A
+SELECT * FROM table_name WHERE ... ORDER BY partition_key_B DESC
+SELECT * FROM table_name WHERE ... ORDER BY partition_key_A ASC
```


@@ -151,6 +155,7 @@ LIMIT number

- **Range**: 1 to 10,000
- **Type**: Integer only
+- **Default**: 500

### Examples

@@ -167,7 +172,7 @@ SELECT * FROM table_name WHERE ... LIMIT 100

```sql
SELECT * FROM http_requests
-WHERE timestamp BETWEEN '2024-01-01' AND '2024-01-02'
+WHERE timestamp BETWEEN '2025-09-24T01:00:00Z' AND '2025-09-25T01:00:00Z'
LIMIT 100
```

@@ -215,6 +220,8 @@ LIMIT 500
| `integer` | Whole numbers | `1`, `42`, `-10`, `0` |
| `float` | Decimal numbers | `1.5`, `3.14`, `-2.7`, `0.0` |
| `string` | Text values | `'hello'`, `'GET'`, `'2024-01-01'` |
+| `boolean` | Boolean values | `true`, `false` |
+| `timestamp` | RFC3339 | `'2025-09-24T01:00:00Z'` |

### Type Usage in Conditions

@@ -237,7 +244,7 @@ SELECT * FROM table_name WHERE country_code = 'US'

## Operator Precedence

-1. **Comparison operators**: `=`, `!=`, `<`, `<=`, `>`, `>=`, `BETWEEN`, `IS NULL`, `IS NOT NULL`
+1. **Comparison operators**: `=`, `!=`, `<`, `<=`, `>`, `>=`, `LIKE`, `BETWEEN`, `IS NULL`, `IS NOT NULL`
2. **AND** (higher precedence)
3. **OR** (lower precedence)

diff --git a/src/content/docs/r2/sql/query-data.mdx b/src/content/docs/r2/sql/query-data.mdx
index 3905eb47b20380..c30e8d6c9ee1d9 100644
--- a/src/content/docs/r2/sql/query-data.mdx
+++ b/src/content/docs/r2/sql/query-data.mdx
@@ -1,6 +1,8 @@
---
title: Query data in R2 Data Catalog
pcx_content_type: example
+sidebar:
+  order: 3
---

:::note
@@ -12,7 +14,7 @@ R2 SQL is currently in open beta
- Sign up for a [Cloudflare account](https://dash.cloudflare.com/sign-up/workers-and-pages).
- [Create an R2 bucket](/r2/buckets/create-buckets/) and [enable the data catalog](/r2/data-catalog/manage-catalogs/#enable-r2-data-catalog-on-a-bucket).
- [Create an R2 API token](/r2/api/tokens/) with [R2, R2 SQL, and data catalog permissions](/r2/api/tokens/#permissions).
-- Tables must have a time-based partition key in order be queried by R2 SQL. Read about the current [limitations](/r2/sql/platform/limitations-best-practices) to learn more.
+- Tables must have a time-based partition key in order to be queried by R2 SQL. Read about the current [limitations](/r2/sql/platform/limitations-best-practices) to learn more.
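+
+For example, for a table that Pipelines partitions by day on the `__ingest_ts` column it appends, a typical query bounds that column (the namespace, table name, and time window below are placeholders):
+
+```sql
+SELECT * FROM namespace.table_name
+WHERE __ingest_ts > '2025-09-24T01:00:00Z'
+LIMIT 10
+```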
R2 SQL can currently be accessed via Wrangler commands or a REST API. @@ -30,7 +32,7 @@ If this is your first time using Wrangler, make sure to login. npx wrangler login ``` -You'll also want to grab the **warehouse** of the your R2 Data Catalog: +You'll also want to grab the **warehouse** of the R2 Data Catalog: ```sh ❯ npx wrangler r2 bucket catalog get [BUCKET_NAME] @@ -71,7 +73,6 @@ curl -X POST \ -H "Authorization: Bearer ${WRANGLER_R2_SQL_AUTH_TOKEN}" \ -H "Content-Type: application/json" \ -d '{ - "warehouse": "your-warehouse-name", "query": "SELECT * FROM namespace.table_name limit 10;" }' | jq . ``` \ No newline at end of file diff --git a/src/content/docs/r2/sql/troubleshooting.mdx b/src/content/docs/r2/sql/troubleshooting.mdx index d233ccdaeffa0c..9a1a18349aa1c7 100644 --- a/src/content/docs/r2/sql/troubleshooting.mdx +++ b/src/content/docs/r2/sql/troubleshooting.mdx @@ -4,7 +4,7 @@ pcx_content_type: concept tags: - SQL sidebar: - order: 5 + order: 7 --- # R2 SQL Troubleshooting Guide @@ -23,12 +23,12 @@ This guide covers potential errors and limitations you may encounter when using ```sql -- Invalid - Missing FROM clause -SELECT user_id WHERE status = 200 +SELECT user_id WHERE status = 200; -- Valid SELECT user_id FROM http_requests -WHERE status = 200 AND timestamp BETWEEN '2024-01-01' AND '2024-01-02' +WHERE status = 200 AND timestamp BETWEEN '2025-09-24T01:00:00Z' AND '2025-09-25T01:00:00Z'; ``` **Solution**: Always include `FROM` in your queries. @@ -47,7 +47,7 @@ WHERE status = 200 AND timestamp BETWEEN '2024-01-01' AND '2024-01-02' ```sql -- Invalid - Aggregate functions not supported -SELECT COUNT(*) FROM events WHERE timestamp > '2024-01-01' +SELECT COUNT(*) FROM events WHERE timestamp > '2025-09-24T01:00:00Z' SELECT AVG(response_time) FROM http_requests WHERE status = 200 SELECT MAX(timestamp) FROM logs WHERE user_id = '123' ``` @@ -260,7 +260,7 @@ SELECT * FROM events WHERE timestamp > '2024-01-01T10:30:00Z' ORDER BY timestamp ### Dynamic Schema Changes
-**Error**: `Sinvalid SQL: only top-level SELECT clause is supported` +**Error**: `invalid SQL: only top-level SELECT clause is supported`
**Problem**: Attempting to modify table schema or reference non-existent columns. diff --git a/src/content/docs/r2/sql/end-to-end-pipeline.mdx b/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx similarity index 84% rename from src/content/docs/r2/sql/end-to-end-pipeline.mdx rename to src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx index 3e236a1e31f28d..cca15b3489b507 100644 --- a/src/content/docs/r2/sql/end-to-end-pipeline.mdx +++ b/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx @@ -59,7 +59,7 @@ npx wrangler login Create a new R2 bucket to store your fraud detection data: ```bash -npx wrangler r2 bucket create fraud-detection-data +npx wrangler r2 bucket create fraud-pipeline ``` ## 3. Enable R2 Data Catalog @@ -67,16 +67,21 @@ npx wrangler r2 bucket create fraud-detection-data Enable the Data Catalog feature on your bucket to use Apache Iceberg tables: ```bash -npx wrangler r2 bucket catalog enable fraud-detection-data +npx wrangler r2 bucket catalog enable fraud-pipeline ``` + :::note -Make sure to save the Warehouse for use later in this guide +Copy the warehouse (ACCOUNTID_BUCKETNAME) and paste it in the `export` below. We'll use it later in the tutorial. ::: +```bash +export $WAREHOUSE= #Paste your warehouse here +``` + ### Optional - Enable compaction on your R2 Data Catalog -R2 Data Catalog can automatically compact tables for you. In production event streaming use cases, it's common to end up with many small files so it's recommended to enable compaction. Since this is a sample use case, this is optional. +R2 Data Catalog can automatically compact tables for you. In production event streaming use cases, it's common to end up with many small files, so it's recommended to enable compaction. Since this is a sample use case, this is optional. ```bash -npx wrangler r2 bucket catalog compaction enable fraud-detection-data --token $WRANGLER_R2_SQL_AUTH_TOKEN +npx wrangler r2 bucket catalog compaction enable fraud-pipeline --token $WRANGLER_R2_SQL_AUTH_TOKEN ``` ## 4. Set up the pipeline infrastructure @@ -93,8 +98,7 @@ First, create a schema file called `raw_transactions_schema.json` with the follo {"name": "transaction_timestamp", "type": "string", "required": false}, {"name": "location", "type": "string", "required": false}, {"name": "merchant_category", "type": "string", "required": false}, - {"name": "is_fraud", "type": "string", "required": false}, - {"name": "ingestion_timestamp", "type": "string", "required": false} + {"name": "is_fraud", "type": "bool", "required": false} ] } ``` @@ -102,10 +106,10 @@ First, create a schema file called `raw_transactions_schema.json` with the follo Create a stream to receive incoming fraud detection events: ```bash -npx wrangler pipelines streams create rawtransactionstream \ +npx wrangler pipelines streams create raw_stream \ --schema-file raw_transactions_schema.json \ --http-enabled true \ - --http-auth true + --http-auth false ``` :::note Note the **HTTP Ingest Endpoint URL** from the output. This is the endpoint you'll use to send data to your pipeline. @@ -117,12 +121,12 @@ export STREAM_ENDPOINT= #the http ingest endpoint from the output (see example b The output should look like this: ```sh -🌀 Creating stream 'rawtransactionstream'... -✨ Successfully created stream 'rawtransactionstream' with id 'stream_id'. +🌀 Creating stream 'raw_stream'... +✨ Successfully created stream 'raw_stream' with id 'stream_id'. 
Creation Summary: General: - Name: rawtransactionstream + Name: raw_stream HTTP Ingest: Enabled: Yes @@ -146,22 +150,18 @@ Input Schema: ├───────────────────────┼────────┼────────────┼──────────┤ │ merchant_category │ string │ │ No │ ├───────────────────────┼────────┼────────────┼──────────┤ -│ is_fraud │ string │ │ No │ -├───────────────────────┼────────┼────────────┼──────────┤ -│ ingestion_timestamp │ string │ │ No │ +│ is_fraud │ bool │ │ No │ └───────────────────────┴────────┴────────────┴──────────┘ ``` - - ### Create the data sink Create a sink that writes data to your R2 bucket as Apache Iceberg tables: ```bash -npx wrangler pipelines sinks create rawtransactionsink \ +npx wrangler pipelines sinks create raw_sink \ --type "r2-data-catalog" \ - --bucket "fraud-detection-data" \ + --bucket "fraud-pipeline" \ --roll-interval 30 \ --namespace "fraud_detection" \ --table "transactions" \ @@ -169,7 +169,7 @@ npx wrangler pipelines sinks create rawtransactionsink \ ``` :::note -This creates a `sink` configuration that will write to the Iceberg table fraud_detection.transactions every 30 seconds. Pipelines automatically appends an `__ingest_ts` column that is used to partion the table by `DAY` +This creates a `sink` configuration that will write to the Iceberg table fraud_detection.transactions in your R2 Data Catalog every 30 seconds. Pipelines automatically appends an `__ingest_ts` column that is used to partition the table by `DAY` ::: ### Create the pipeline @@ -177,8 +177,8 @@ This creates a `sink` configuration that will write to the Iceberg table fraud_d Connect your stream to your sink with SQL: ```bash -npx wrangler pipelines create transactionspipeline \ - --sql "INSERT INTO rawtransactionsink SELECT * FROM rawtransactionstream" +npx wrangler pipelines create raw_events_pipeline \ + --sql "INSERT INTO raw_sink SELECT * FROM raw_stream" ``` ## 5. Generate fraud detection data @@ -200,7 +200,7 @@ API_TOKEN = os.environ["WRANGLER_R2_SQL_AUTH_TOKEN"] #the same one created earli EVENTS_TO_SEND = 1000 # Feel free to adjust this def generate_transaction(): - """Generate some random transactions with occassional fraud""" + """Generate some random transactions with occasional fraud""" # User IDs high_risk_users = [1001, 1002, 1003, 1004, 1005] @@ -263,8 +263,7 @@ def generate_transaction(): "transaction_timestamp": transaction_time.isoformat(), "location": location, "merchant_category": merchant_category, - "is_fraud": "TRUE" if is_fraud else "FALSE", - "ingestion_timestamp": datetime.now(timezone.utc).isoformat() + "is_fraud": True if is_fraud else False } def send_batch_to_stream(events, batch_size=100): @@ -280,7 +279,7 @@ def send_batch_to_stream(events, batch_size=100): for i in range(0, len(events), batch_size): batch = events[i:i + batch_size] - fraud_in_batch = sum(1 for event in batch if event["is_fraud"] == "TRUE") + fraud_in_batch = sum(1 for event in batch if event["is_fraud"] == True) try: response = requests.post(STREAM_ENDPOINT, headers=headers, json=batch) @@ -309,7 +308,7 @@ def main(): if (i + 1) % 100 == 0: print(f"Generated {i + 1} events...") - fraud_events = sum(1 for event in events if event["is_fraud"] == "TRUE") + fraud_events = sum(1 for event in events if event["is_fraud"] == True) print(f"📊 Generated {len(events)} total events ({fraud_events} fraud, {fraud_events/len(events)*100:.1f}%)") # Send to stream @@ -339,7 +338,7 @@ Now you can analyze your fraud detection data using R2 SQL. 
Here are some exampl ### View recent transactions ```bash -npx wrangler r2 sql query "YOUR_WAREHOUSE" " +npx wrangler r2 sql query "$WAREHOUSE" " SELECT transaction_id, user_id, @@ -350,32 +349,29 @@ SELECT transaction_timestamp FROM fraud_detection.transactions WHERE __ingest_ts > '2025-09-24T01:00:00Z' -AND is_fraud = 'TRUE' +AND is_fraud = true LIMIT 10" ``` -:::note -Replace `YOUR_WAREHOUSE` with your R2 Data Catalog warehouse. This in the form of `{YOUR_ACCOUNT_ID}_{BUCKET_NAME}`. This can be found in the dash under the settings in your bucket. Adjust the `__ingest_ts` date in the query as needed. -::: ### Let's filter the raw transactions into a new table to highlight high-value transactions Create a new sink that will write the filtered data to a new Apache Iceberg table in R2 Data Catalog: ```bash -npx wrangler pipelines sinks create filteredfraudsink \ +npx wrangler pipelines sinks create fraud_filter_sink \ --type "r2-data-catalog" \ - --bucket "fraud-detection-data" \ + --bucket "fraud-pipeline" \ --roll-interval 30 \ --namespace "fraud_detection" \ --table "fraud_transactions" \ --catalog-token $WRANGLER_R2_SQL_AUTH_TOKEN ``` -Now you'll create a new SQL query to process data from the original `rawtransactionstream` stream and only write flagged transactions that are over the `amount` of 1000. +Now you'll create a new SQL query to process data from the original `raw_stream` stream and only write flagged transactions that are over the `amount` of 1000. ```bash -npx wrangler pipelines create fraudpipeline \ - --sql "INSERT INTO filteredfraudsink SELECT * FROM rawtransactionstream WHERE is_fraud='TRUE' and amount > 1000" +npx wrangler pipelines create fraud_events_pipeline \ + --sql "INSERT INTO fraud_filter_sink SELECT * FROM raw_stream WHERE is_fraud=true and amount > 1000" ``` :::note @@ -384,7 +380,7 @@ It may take a few minutes for the new Pipeline to fully Initialize and start pro Let's query the table and check the results: ```bash -npx wrangler r2 sql query "YOUR_WAREHOUSE" " +npx wrangler r2 sql query "$WAREHOUSE" " SELECT transaction_id, user_id, @@ -398,7 +394,7 @@ LIMIT 10" ``` Let's also verify that the non-fraudulent events are being filtered out: ```bash -npx wrangler r2 sql query "YOUR_WAREHOUSE" " +npx wrangler r2 sql query "$WAREHOUSE" " SELECT transaction_id, user_id, @@ -408,7 +404,7 @@ SELECT is_fraud, transaction_timestamp FROM fraud_detection.fraud_transactions -WHERE is_fraud = 'FALSE' +WHERE is_fraud = false LIMIT 10" ``` You should see the following output: diff --git a/src/content/docs/r2/sql/tutorials/index.mdx b/src/content/docs/r2/sql/tutorials/index.mdx new file mode 100644 index 00000000000000..78c229f8741630 --- /dev/null +++ b/src/content/docs/r2/sql/tutorials/index.mdx @@ -0,0 +1,7 @@ +--- +title: Tutorials +pcx_content_type: navigation +sidebar: + group: + hideIndex: true +--- From 9512bde1bea1c150737ce93a76555ff1aaaafbe4 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Sat, 20 Sep 2025 15:38:40 -0700 Subject: [PATCH 07/30] Update get-started.mdx --- src/content/docs/r2/sql/get-started.mdx | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/content/docs/r2/sql/get-started.mdx b/src/content/docs/r2/sql/get-started.mdx index cc6773163e5977..3b4a518140d710 100644 --- a/src/content/docs/r2/sql/get-started.mdx +++ b/src/content/docs/r2/sql/get-started.mdx @@ -39,7 +39,7 @@ You'll need API tokens to interact with Cloudflare services. 2. Select **Create Token** → **Custom token** 3. 
Add the following permissions: - **Workers Pipelines** - Read, Send, Edit - - **Workers R2 Storage** - Edit, Read + - **Workers R2 Storage** - Edit, Read - **Workers R2 Data Catalog** - Edit, Read - **Workers R2 SQL** - Read From 579cbf2b6a849938f49b014e21b3c9d85b7ea654 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Sat, 20 Sep 2025 15:39:30 -0700 Subject: [PATCH 08/30] Update end-to-end-pipeline.mdx --- src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx b/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx index cca15b3489b507..6759f1cb0d8273 100644 --- a/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx +++ b/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx @@ -41,7 +41,7 @@ You'll need API tokens to interact with Cloudflare services. - **Workers R2 Storage** - Edit, Read - **Workers R2 Data Catalog** - Edit, Read - **Workers R2 SQL** - Read - - **Workers R2 SQL** - Read, Send, Edit + - **Workers R2 SQL** - Read, Send, Edit Export your new token as an environment variable: From 3b1acc70e06b30d47761ca7cf8732d3555df81d1 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Mon, 22 Sep 2025 13:11:13 -0700 Subject: [PATCH 09/30] added dash steps/tabs, moved out of r2, reformatted most of the R2 SQL docs --- src/content/dash-routes/index.json | 2 +- .../docs/{r2/sql => r2-sql}/get-started.mdx | 165 ++++++++++++-- src/content/docs/r2-sql/index.mdx | 55 +++++ src/content/docs/r2-sql/query-data.mdx | 133 ++++++++++++ .../platform => r2-sql/reference}/index.mdx | 2 +- .../reference}/limitations-best-practices.mdx | 0 .../platform => r2-sql/reference}/pricing.mdx | 0 .../reference}/sql-reference.mdx | 0 .../{r2/sql => r2-sql}/troubleshooting.mdx | 2 + .../tutorials/end-to-end-pipeline.mdx | 201 +++++++++++++++--- .../{r2/sql => r2-sql}/tutorials/index.mdx | 0 src/content/docs/r2/r2-sql.mdx | 9 + src/content/docs/r2/sql/index.mdx | 21 -- src/content/docs/r2/sql/query-data.mdx | 78 ------- src/content/products/r2-sql.yaml | 12 ++ src/icons/r2-sql.svg | 1 + 16 files changed, 533 insertions(+), 148 deletions(-) rename src/content/docs/{r2/sql => r2-sql}/get-started.mdx (61%) create mode 100644 src/content/docs/r2-sql/index.mdx create mode 100644 src/content/docs/r2-sql/query-data.mdx rename src/content/docs/{r2/sql/platform => r2-sql/reference}/index.mdx (81%) rename src/content/docs/{r2/sql/platform => r2-sql/reference}/limitations-best-practices.mdx (100%) rename src/content/docs/{r2/sql/platform => r2-sql/reference}/pricing.mdx (100%) rename src/content/docs/{r2/sql/platform => r2-sql/reference}/sql-reference.mdx (100%) rename src/content/docs/{r2/sql => r2-sql}/troubleshooting.mdx (99%) rename src/content/docs/{r2/sql => r2-sql}/tutorials/end-to-end-pipeline.mdx (72%) rename src/content/docs/{r2/sql => r2-sql}/tutorials/index.mdx (100%) create mode 100644 src/content/docs/r2/r2-sql.mdx delete mode 100644 src/content/docs/r2/sql/index.mdx delete mode 100644 src/content/docs/r2/sql/query-data.mdx create mode 100644 src/content/products/r2-sql.yaml create mode 100644 src/icons/r2-sql.svg diff --git a/src/content/dash-routes/index.json b/src/content/dash-routes/index.json index c9037feda8e904..7cba51353839fc 100644 --- a/src/content/dash-routes/index.json +++ b/src/content/dash-routes/index.json @@ -261,7 +261,7 @@ }, { "name": "Pipelines", - "deeplink": "/?to=/:account/workers/pipelines", + "deeplink": "/?to=/:account/pipelines", "parent": ["Storage & 
Databases"] }, { diff --git a/src/content/docs/r2/sql/get-started.mdx b/src/content/docs/r2-sql/get-started.mdx similarity index 61% rename from src/content/docs/r2/sql/get-started.mdx rename to src/content/docs/r2-sql/get-started.mdx index 3b4a518140d710..909218bee3ed01 100644 --- a/src/content/docs/r2/sql/get-started.mdx +++ b/src/content/docs/r2-sql/get-started.mdx @@ -8,6 +8,10 @@ description: Learn how to get up and running with R2 SQL using R2 Data Catalog a --- import { Render, + Steps, + Tabs, + TabItem, + DashButton, LinkCard, } from "~/components"; @@ -34,19 +38,28 @@ Use a Node version manager like [Volta](https://volta.sh/) or [nvm](https://gith You'll need API tokens to interact with Cloudflare services. -### Custom API Token -1. Go to **My Profile** → **API Tokens** in the Cloudflare dashboard -2. Select **Create Token** → **Custom token** -3. Add the following permissions: - - **Workers Pipelines** - Read, Send, Edit - - **Workers R2 Storage** - Edit, Read - - **Workers R2 Data Catalog** - Edit, Read - - **Workers R2 SQL** - Read + +1. In the Cloudflare dashboard, go to the **R2 object storage** page. + + +2. Select **Manage API tokens**. + +3. Select **Create API token**. + +4. Select the **R2 Token** text to edit your API token name. + +5. Under **Permissions**, choose the **Admin Read & Write** permission. + +6. Select **Create API Token**. + +7. Note the **Token value**. + + Export your new token as an environment variable: ```bash -export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here +export WRANGLER_R2_SQL_AUTH_TOKEN= #paste your token here ``` If this is your first time using Wrangler, make sure to login. @@ -54,23 +67,75 @@ If this is your first time using Wrangler, make sure to login. npx wrangler login ``` -## 2. Create an R2 bucket +## 2. Create an R2 bucket and enable R2 Data Catalog + + + + +Create an R2 bucket: + + ```bash + npx wrangler r2 bucket create r2-sql-demo + ``` + + + + + +1. In the Cloudflare dashboard, go to the **R2 object storage** page. + -Create a new R2 bucket: +2. Select **Create bucket**. + +3. Enter the bucket name: r2-sql-demo + +4. Select **Create bucket**. + + + + +## 2. Enable R2 Data Catalog + + + + +Enable the catalog on your R2 bucket: ```bash -npx wrangler r2 bucket create r2-sql-demo +npx wrangler r2 bucket catalog enable r2-sql-demo ``` -## 3. Enable R2 Data Catalog +When you run this command, take note of the "Warehouse". You will need these later. + + + + + +1. In the Cloudflare dashboard, go to the **R2 object storage** page. + + +2. Select the bucket: r2-sql-demo. + +3. Switch to the **Settings** tab, scroll down to **R2 Data Catalog**, and select **Enable**. + +4. Once enabled, note the **Catalog URI** and **Warehouse name**. + + + -Enable [R2 Data Catalog](/r2/data-catalog/) feature on your bucket to use Apache Iceberg tables: + +:::note +Copy the warehouse (ACCOUNTID_BUCKETNAME) and paste it in the `export` below. We'll use it later in the tutorial. +::: ```bash -npx wrangler r2 bucket catalog enable r2-sql-demo +export $WAREHOUSE= #Paste your warehouse here ``` -## 4. Create the data Pipeline +## 3. Create the data Pipeline + + + ### 1. Create the Pipeline Stream First, create a schema file called `demo_schema.json` with the following `json` schema: @@ -157,13 +222,75 @@ npx wrangler pipelines create demo_pipeline \ Note that there is a filter on this statement that will only send events where `numbers` is greater than 5 ::: + + + +1. In the Cloudflare dashboard, go to **Pipelines** > **Pipelines**. + + +2. 
Select **Create Pipeline**. + +3. **Connect to a Stream**: + - Pipeline name: `demo` + - Enable HTTP endpoint for sending data: Enabled + - HTTP authentication: Disabled (default) + - Select **Next** + +4. **Define Input Schema**: + - Select **JSON editor** + - Copy in the schema: + ```json + { + "fields": [ + {"name": "user_id", "type": "int64", "required": true}, + {"name": "payload", "type": "string", "required": false}, + {"name": "numbers", "type": "int32", "required": false} + ] + } + ``` + + - Select **Next** + +5. **Define Sink**: + - Select your R2 bucket: `r2-sql-demo` + - Storage type: **R2 Data Catalog** + - Namespace: `fraud_detection` + - Table name: `transactions` + - **Advanced Settings**: Change **Maximum Time Interval** to `30 seconds` + - Select **Next** + +6. **Credentials**: + - Disable **Automatically create an Account API token for your sink** + - Enter **Catalog Token** from step 1 + - Select **Next** + +7. **Pipeline Definition**: + - Leave the default SQL query: + ```sql + INSERT INTO demo_sink SELECT * FROM demo_stream; + ``` + - Select **Create Pipeline** + +8. :::note + Note the **HTTP Ingest Endpoint URL** from the output. This is the endpoint you'll use to send data to your pipeline. + ::: + + + +```bash +# The http ingest endpoint +export STREAM_ENDPOINT= #the http ingest endpoint from the output (see example below) +``` + + + + ## 5. Send some data Next, let's send some events to our stream: ```curl curl -X POST "$STREAM_ENDPOINT" \ - -H "Authorization: Bearer YOUR_API_TOKEN" \ -H "Content-Type: application/json" \ -d '[ { @@ -194,7 +321,7 @@ This will send 4 events in one `POST`. Since our Pipeline is filtering out recor After you've sent your events to the stream, it will take about 30 seconds for the data to show in the table since that's what we configured our `roll interval` to be in the Sink. ```bash -npx wrangler r2 sql query "SELECT * FROM demo.first_table LIMIT 10" +npx wrangler r2 sql query "$WAREHOUSE" "SELECT * FROM demo.first_table LIMIT 10" ``` diff --git a/src/content/docs/r2-sql/index.mdx b/src/content/docs/r2-sql/index.mdx new file mode 100644 index 00000000000000..554d31c511cd99 --- /dev/null +++ b/src/content/docs/r2-sql/index.mdx @@ -0,0 +1,55 @@ +--- +pcx_content_type: navigation +title: R2 SQL +sidebar: + order: 7 +head: + - tag: title + content: R2 SQL +description: A distributed SQL engine for R2 Data Catalog +--- + +## Query Apache Iceberg tables in R2 Data Catalog Using R2 SQL + + +:::note +R2 SQL is in public beta, and any developer with an R2 subscription can start using it. Currently, outside of standard R2 storage and operations, you will not be billed for your use of R2 SQL. We will update [the pricing page](/r2-sql/reference/pricing) and provide at least 30 days notice before enabling billing. +::: + +R2 SQL is Cloudflare's serverless, distributed, analytics query engine for querying [Apache Iceberg](https://iceberg.apache.org/) tables stored in [R2 data catalog](https://developers.cloudflare.com/r2/data-catalog/). R2 SQL is designed to efficiently query large amounts of data by automatically utilizing file pruning, Cloudflare's distributed compute, and R2 object storage. + +```sh +❯ npx wrangler r2 sql query "3373912de3f5202317188ae01300bd6_data-catalog" \ +"SELECT * FROM default.transactions LIMIT 10" + + ⛅️ wrangler 4.38.0 +──────────────────────────────────────────────────────────────────────────── +▲ [WARNING] 🚧 `wrangler r2 sql query` is an open-beta command. 
Please report any issues to https://github.com/cloudflare/workers-sdk/issues/new/choose + + +┌─────────────────────────────┬──────────────────────────────────────┬─────────┬──────────┬──────────────────────────────────┬───────────────┬───────────────────┬──────────┐ +│ __ingest_ts │ transaction_id │ user_id │ amount │ transaction_timestamp │ location │ merchant_category │ is_fraud │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.872554Z │ fdc1beed-157c-4d2d-90cf-630fdea58051 │ 1679 │ 13241.59 │ 2025-09-20T02:23:04.269988+00:00 │ NEW_YORK │ RESTAURANT │ false │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.724378Z │ ea7ef106-8284-4d08-9348-ad33989b6381 │ 1279 │ 17615.79 │ 2025-09-20T02:23:04.271090+00:00 │ MIAMI │ GAS_STATION │ true │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.724330Z │ afcdee4d-5c71-42be-97ec-e282b6937a8c │ 1843 │ 7311.65 │ 2025-09-20T06:23:04.267890+00:00 │ SEATTLE │ GROCERY │ true │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.657007Z │ b99d14e0-dbe0-49bc-a417-0ee57f8bed99 │ 1976 │ 15228.21 │ 2025-09-16T23:23:04.269426+00:00 │ NEW_YORK │ RETAIL │ false │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.656992Z │ 712cd094-ad4c-4d24-819a-0d3daaaceea1 │ 1184 │ 7570.89 │ 2025-09-20T00:23:04.269163+00:00 │ LOS_ANGELES │ RESTAURANT │ true │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.656912Z │ b5a1aab3-676d-4492-92b8-aabcde6db261 │ 1196 │ 46611.25 │ 2025-09-20T16:23:04.268693+00:00 │ NEW_YORK │ RETAIL │ true │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.613740Z │ 432d3976-8d89-4813-9099-ea2afa2c0e70 │ 1720 │ 21547.9 │ 2025-09-20T05:23:04.273681+00:00 │ SAN FRANCISCO │ GROCERY │ true │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.532068Z │ 25e0b851-3092-4ade-842f-e3189e07d4ee │ 1562 │ 29311.54 │ 2025-09-20T05:23:04.277405+00:00 │ NEW_YORK │ RETAIL │ false │ +├─────────────────────────────┼──────────────────────────────────────┼─────────┼──────────┼──────────────────────────────────┼───────────────┼───────────────────┼──────────┤ +│ 2025-09-20T22:30:11.526037Z │ 8001746d-05fe-42fe-a189-40caf81d7aa2 │ 1817 │ 15976.5 │ 2025-09-15T16:23:04.266632+00:00 │ SEATTLE │ RESTAURANT │ true │ +└─────────────────────────────┴──────────────────────────────────────┴─────────┴──────────┴──────────────────────────────────┴───────────────┴───────────────────┴──────────┘ +Read 11.3 kB across 4 files 
from R2 +On average, 3.36 kB / s +``` + +Create an end to end data pipeline and query your first table in R2 SQL by following [this step by step guide](/r2-sql/tutorials/end-to-end-pipeline/), learn how to create a data pipeline that takes a stream of events and automatically creates an Apache Iceberg table, making them accessible with R2 SQL. \ No newline at end of file diff --git a/src/content/docs/r2-sql/query-data.mdx b/src/content/docs/r2-sql/query-data.mdx new file mode 100644 index 00000000000000..a4aeee435eb273 --- /dev/null +++ b/src/content/docs/r2-sql/query-data.mdx @@ -0,0 +1,133 @@ +--- +title: Query data in R2 Data Catalog +pcx_content_type: configuration +description: Understand how to query data with R2 SQL +sidebar: + order: 3 +--- +import { + Render, + LinkCard, +} from "~/components"; + +:::note +R2 SQL is currently in open beta +::: + +Learn how to: +- Create an API key with the necessary permissions. +- Query data with R2 SQL. + +R2 SQL can currently be accessed via Wrangler commands or a REST API. + +## Create an API key with the right permissions + +To query Apache Iceberg tables in R2 Data Catalog, you must provide a Cloudflare API token with R2 SQL, R2 Data Catalog, and R2 storage permissions. + +### Create API token in the dashboard + +Create an [API token](https://dash.cloudflare.com/profile/api-tokens) with: + +- Access to R2 Data Catalog (**minimum**: read-only) +- Access to R2 storage (**minimum**: read-only) +- Access to R2 SQL (**minimum**: read-only) + +Wrangler now supports the environment variable `WRANGLER_R2_SQL_AUTH_TOKEN` which you can `export` your token as. + +### Create API token via API + +To create an API token programmatically for use with R2 SQL, you'll need to specify R2 SQL, R2 Data Catalog, and R2 storage permission groups in your [Access Policy](/r2/api/tokens/#access-policy). + +#### Example Access Policy + +```json +[ + { + "id": "f267e341f3dd4697bd3b9f71dd96247f", + "effect": "allow", + "resources": { + "com.cloudflare.edge.r2.bucket.4793d734c0b8e484dfc37ec392b5fa8a_default_my-bucket": "*", + "com.cloudflare.edge.r2.bucket.4793d734c0b8e484dfc37ec392b5fa8a_eu_my-eu-bucket": "*" + }, + "permission_groups": [ + { + "id": "45db74139a62490b9b60eb7c4f34994b", + "name": "Workers R2 Data Catalog Read" + }, + { + "id": "6a018a9f2fc74eb6b293b0c548f38b39", + "name": "Workers R2 Storage Bucket Item Read" + }, + { + "id": "f45430d92e2b4a6cb9f94f2594c141b8", + "name": "Workers R2 SQL Read" + } + ] + } +] +``` + + +## Query data via Wrangler + +Export your R2 API token as an environment variable: + +```bash +export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here +``` + +If this is your first time using Wrangler, make sure to login. +```bash +npx wrangler login +``` + +:::note +You'll want to copy the **warehouse** of the R2 Data Catalog: +::: + +```sh +❯ npx wrangler r2 bucket catalog get [BUCKET_NAME] + + ⛅️ wrangler 4.38.0 +──────────────────────────────────────────────────────────────────────────── +▲ [WARNING] 🚧 `wrangler r2 bucket catalog get` is an open-beta command. 
Please report any issues to https://github.com/cloudflare/workers-sdk/issues/new/choose + + +Catalog URI: https://catalog.cloudflarestorage.com/[ACCOUNT_ID]/[BUCKET_NAME] +Warehouse: [ACCOUNT_ID]_[BUCKET_NAME] +Status: active +``` + +To query R2 SQL with Wrangler, simply run: + +```sh +npx wrangler r2 sql query "YOUR_WAREHOUSE" "SELECT * FROM namespace.table_name limit 10;" +``` +For a full list of supported sql commands, check out the [R2 SQL reference page](/r2-sql/reference/sql-reference). + + +## REST API +Below is an example of using R2 SQL via the REST endpoint: + +```bash +curl -X POST \ + "https://api.sql.cloudflarestorage.com/api/v1/accounts/{ACCOUNT_ID}/r2-sql/query/{BUCKET_NAME}" \ + -H "Authorization: Bearer ${WRANGLER_R2_SQL_AUTH_TOKEN}" \ + -H "Content-Type: application/json" \ + -d '{ + "query": "SELECT * FROM namespace.table_name limit 10;" + }' +``` + +Learn more: + + + diff --git a/src/content/docs/r2/sql/platform/index.mdx b/src/content/docs/r2-sql/reference/index.mdx similarity index 81% rename from src/content/docs/r2/sql/platform/index.mdx rename to src/content/docs/r2-sql/reference/index.mdx index ef43ff93fe3c19..ab0a6ad35089fb 100644 --- a/src/content/docs/r2/sql/platform/index.mdx +++ b/src/content/docs/r2-sql/reference/index.mdx @@ -1,5 +1,5 @@ --- -title: Platform +title: Reference pcx_content_type: navigation sidebar: group: diff --git a/src/content/docs/r2/sql/platform/limitations-best-practices.mdx b/src/content/docs/r2-sql/reference/limitations-best-practices.mdx similarity index 100% rename from src/content/docs/r2/sql/platform/limitations-best-practices.mdx rename to src/content/docs/r2-sql/reference/limitations-best-practices.mdx diff --git a/src/content/docs/r2/sql/platform/pricing.mdx b/src/content/docs/r2-sql/reference/pricing.mdx similarity index 100% rename from src/content/docs/r2/sql/platform/pricing.mdx rename to src/content/docs/r2-sql/reference/pricing.mdx diff --git a/src/content/docs/r2/sql/platform/sql-reference.mdx b/src/content/docs/r2-sql/reference/sql-reference.mdx similarity index 100% rename from src/content/docs/r2/sql/platform/sql-reference.mdx rename to src/content/docs/r2-sql/reference/sql-reference.mdx diff --git a/src/content/docs/r2/sql/troubleshooting.mdx b/src/content/docs/r2-sql/troubleshooting.mdx similarity index 99% rename from src/content/docs/r2/sql/troubleshooting.mdx rename to src/content/docs/r2-sql/troubleshooting.mdx index 9a1a18349aa1c7..ad4688334bbb3b 100644 --- a/src/content/docs/r2/sql/troubleshooting.mdx +++ b/src/content/docs/r2-sql/troubleshooting.mdx @@ -7,6 +7,8 @@ sidebar: order: 7 --- + + # R2 SQL Troubleshooting Guide This guide covers potential errors and limitations you may encounter when using R2 SQL. R2 SQL is in open beta and supported functionality will evolve and change over time. 
diff --git a/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx b/src/content/docs/r2-sql/tutorials/end-to-end-pipeline.mdx similarity index 72% rename from src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx rename to src/content/docs/r2-sql/tutorials/end-to-end-pipeline.mdx index 6759f1cb0d8273..f8b6d7face7e29 100644 --- a/src/content/docs/r2/sql/tutorials/end-to-end-pipeline.mdx +++ b/src/content/docs/r2-sql/tutorials/end-to-end-pipeline.mdx @@ -6,12 +6,21 @@ products: - R2 - R2 Data Catalog - R2 SQL + - Pipelines --- +import { + Render, + Steps, + Tabs, + TabItem, + DashButton, + LinkCard, +} from "~/components"; -# Build a fraud detection pipeline with the Cloudflare Data Platform +# Build an end to end data pipeline with the Cloudflare Data Platform -In this guide, you will learn how to build a complete data pipeline using Cloudflare Pipelines, R2 Data Catalog, and R2 SQL. This also includes a sample Python script that creates and sends financial transaction data to your Pipeline that can be queried by R2 SQL or any Apache Iceberg-compatible query engine. +In this tutorial, you will learn how to build a complete data pipeline using Cloudflare Pipelines, R2 Data Catalog, and R2 SQL. This also includes a sample Python script that creates and sends financial transaction data to your Pipeline that can be queried by R2 SQL or any Apache Iceberg-compatible query engine. This tutorial demonstrates how to: - Set up R2 Data Catalog to store our transaction events in an Apache Iceberg table @@ -21,7 +30,6 @@ This tutorial demonstrates how to: ## Prerequisites - 1. Sign up for a [Cloudflare account](https://dash.cloudflare.com/sign-up). 2. Install [Node.js](https://nodejs.org/en/). 3. Install [Python 3.8+](https://python.org) for the data generation script. @@ -34,19 +42,37 @@ Use a Node version manager like [Volta](https://volta.sh/) or [nvm](https://gith You'll need API tokens to interact with Cloudflare services. -### Custom API Token -1. Go to **My Profile** → **API Tokens** in the Cloudflare dashboard -2. Select **Create Token** → **Custom token** -3. Add the following permissions: - - **Workers R2 Storage** - Edit, Read - - **Workers R2 Data Catalog** - Edit, Read - - **Workers R2 SQL** - Read - - **Workers R2 SQL** - Read, Send, Edit + + +1. In the Cloudflare dashboard, go to the **API tokens** page. + + +2. Select **Create Token**. + +3. Select **Get started** next to Create Custom Token. + +4. Enter a name for your API token. + +5. Under **Permissions**, choose: + - **Workers Pipelines** with Read, Send, and Edit permissions + - **Workers R2 Data Catalog** with Read and Edit permissions + - **Workers R2 SQL** with Read permissions + - **Workers R2 Storage** with Read and Edit permissions + +6. Optionally add a TTL to this token + +7. Select **Continue to summary**. + +8. Click **Create Token** + +8. Note the **Token value**. + + Export your new token as an environment variable: ```bash -export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here +export WRANGLER_R2_SQL_AUTH_TOKEN= #paste your token here ``` If this is your first time using Wrangler, make sure to login. @@ -54,22 +80,63 @@ If this is your first time using Wrangler, make sure to login. npx wrangler login ``` -## 2. Create an R2 bucket +## 2. Create an R2 bucket and enable R2 Data Catalog -Create a new R2 bucket to store your fraud detection data: + + -```bash -npx wrangler r2 bucket create fraud-pipeline -``` +Create an R2 bucket: + + ```bash + npx wrangler r2 bucket create fraud-pipeline + ``` + + + + + +1. 
In the Cloudflare dashboard, go to the **R2 object storage** page. + + +2. Select **Create bucket**. -## 3. Enable R2 Data Catalog +3. Enter the bucket name: fraud-pipeline -Enable the Data Catalog feature on your bucket to use Apache Iceberg tables: +4. Select **Create bucket**. + + + + +## 2. Enable R2 Data Catalog + + + + +Enable the catalog on your R2 bucket: ```bash npx wrangler r2 bucket catalog enable fraud-pipeline ``` +When you run this command, take note of the "Warehouse" and "Catalog URI". You will need these later. + + + + + +1. In the Cloudflare dashboard, go to the **R2 object storage** page. + + +2. Select the bucket: fraud-pipeline. + +3. Switch to the **Settings** tab, scroll down to **R2 Data Catalog**, and select **Enable**. + +4. Once enabled, note the **Catalog URI** and **Warehouse name**. + + + + + :::note Copy the warehouse (ACCOUNTID_BUCKETNAME) and paste it in the `export` below. We'll use it later in the tutorial. ::: @@ -80,14 +147,34 @@ export $WAREHOUSE= #Paste your warehouse here ### Optional - Enable compaction on your R2 Data Catalog R2 Data Catalog can automatically compact tables for you. In production event streaming use cases, it's common to end up with many small files, so it's recommended to enable compaction. Since this is a sample use case, this is optional. + + + ```bash npx wrangler r2 bucket catalog compaction enable fraud-pipeline --token $WRANGLER_R2_SQL_AUTH_TOKEN ``` + + + + +1. In the Cloudflare dashboard, go to the **R2 object storage** page. + + +2. Select the bucket: fraud-pipeline. + +3. Switch to the **Settings** tab, scroll down to **R2 Data Catalog**, click on edit icon, and select **Enable**. + +4. You can choose a target file size or leave the default. Click save. + + + + ## 4. Set up the pipeline infrastructure ### Create the Pipeline stream - + + First, create a schema file called `raw_transactions_schema.json` with the following `json` schema: ```json { @@ -106,7 +193,7 @@ First, create a schema file called `raw_transactions_schema.json` with the follo Create a stream to receive incoming fraud detection events: ```bash -npx wrangler pipelines streams create raw_stream \ +npx wrangler pipelines streams create raw_events_stream \ --schema-file raw_transactions_schema.json \ --http-enabled true \ --http-auth false @@ -121,12 +208,12 @@ export STREAM_ENDPOINT= #the http ingest endpoint from the output (see example b The output should look like this: ```sh -🌀 Creating stream 'raw_stream'... -✨ Successfully created stream 'raw_stream' with id 'stream_id'. +🌀 Creating stream 'raw_events_stream'... +✨ Successfully created stream 'raw_events_stream' with id 'stream_id'. Creation Summary: General: - Name: raw_stream + Name: raw_events_stream HTTP Ingest: Enabled: Yes @@ -159,7 +246,7 @@ Input Schema: Create a sink that writes data to your R2 bucket as Apache Iceberg tables: ```bash -npx wrangler pipelines sinks create raw_sink \ +npx wrangler pipelines sinks create raw_events_sink \ --type "r2-data-catalog" \ --bucket "fraud-pipeline" \ --roll-interval 30 \ @@ -178,8 +265,66 @@ Connect your stream to your sink with SQL: ```bash npx wrangler pipelines create raw_events_pipeline \ - --sql "INSERT INTO raw_sink SELECT * FROM raw_stream" + --sql "INSERT INTO raw_events_sink SELECT * FROM raw_events_stream" ``` + + + +1. In the Cloudflare dashboard, go to **Pipelines** > **Pipelines**. + + +2. Select **Create Pipeline**. + +3. 
**Connect to a Stream**: + - Pipeline name: `raw_events` + - Enable HTTP endpoint for sending data: Enabled + - HTTP authentication: Disabled (default) + - Select **Next** + +4. **Define Input Schema**: + - Select **JSON editor** + - Copy in the schema: + ```json + { + "fields": [ + {"name": "transaction_id", "type": "string", "required": true}, + {"name": "user_id", "type": "int64", "required": true}, + {"name": "amount", "type": "f64", "required": false}, + {"name": "transaction_timestamp", "type": "string", "required": false}, + {"name": "location", "type": "string", "required": false}, + {"name": "merchant_category", "type": "string", "required": false}, + {"name": "is_fraud", "type": "bool", "required": false} + ] + } + ``` + + - Select **Next** + +5. **Define Sink**: + - Select your R2 bucket: `fraud-pipeline` + - Storage type: **R2 Data Catalog** + - Namespace: `fraud_detection` + - Table name: `transactions` + - **Advanced Settings**: Change **Maximum Time Interval** to `30 seconds` + - Select **Next** + +6. **Credentials**: + - Disable **Automatically create an Account API token for your sink** + - Enter **Catalog Token** from step 1 + - Select **Next** + +7. **Pipeline Definition**: + - Leave the default SQL query: + ```sql + INSERT INTO raw_events_sink SELECT * FROM raw_events_stream; + ``` + - Select **Create Pipeline** + +8. After pipeline creation, note the **Stream ID** for the next step. + + + + ## 5. Generate fraud detection data @@ -367,11 +512,11 @@ npx wrangler pipelines sinks create fraud_filter_sink \ --catalog-token $WRANGLER_R2_SQL_AUTH_TOKEN ``` -Now you'll create a new SQL query to process data from the original `raw_stream` stream and only write flagged transactions that are over the `amount` of 1000. +Now you'll create a new SQL query to process data from the original `raw_events_stream` stream and only write flagged transactions that are over the `amount` of 1000. ```bash npx wrangler pipelines create fraud_events_pipeline \ - --sql "INSERT INTO fraud_filter_sink SELECT * FROM raw_stream WHERE is_fraud=true and amount > 1000" + --sql "INSERT INTO fraud_filter_sink SELECT * FROM raw_events_stream WHERE is_fraud=true and amount > 1000" ``` :::note diff --git a/src/content/docs/r2/sql/tutorials/index.mdx b/src/content/docs/r2-sql/tutorials/index.mdx similarity index 100% rename from src/content/docs/r2/sql/tutorials/index.mdx rename to src/content/docs/r2-sql/tutorials/index.mdx diff --git a/src/content/docs/r2/r2-sql.mdx b/src/content/docs/r2/r2-sql.mdx new file mode 100644 index 00000000000000..44656fe71508e6 --- /dev/null +++ b/src/content/docs/r2/r2-sql.mdx @@ -0,0 +1,9 @@ +--- +pcx_content_type: navigation +title: R2 SQL +external_link: /r2-sql/ +sidebar: + order: 7 + group: + badge: Beta +--- \ No newline at end of file diff --git a/src/content/docs/r2/sql/index.mdx b/src/content/docs/r2/sql/index.mdx deleted file mode 100644 index a97dd2bfbd417b..00000000000000 --- a/src/content/docs/r2/sql/index.mdx +++ /dev/null @@ -1,21 +0,0 @@ ---- -pcx_content_type: navigation -title: R2 SQL -sidebar: - order: 7 - group: - badge: Beta -head: [] -description: A distributed SQL engine for R2 Data Catalog ---- - -## Efficiently Query Apache Iceberg tables in R2 Data Catalog Using R2 SQL. - - -:::note -R2 SQL is in public beta, and any developer with an R2 subscription can start using it. 
Currently, outside of standard R2 storage and operations, you will not be billed for your use of R2 SQL -::: - -R2 SQL is Cloudflare's serverless, distributed, analytics query engine for querying Apache Iceberg tables stored in [R2 data catalog](https://developers.cloudflare.com/r2/data-catalog/). R2 SQL is designed to efficiently query large amounts of data by automatically utilizing file pruning, Cloudflare's distributed compute, and R2 object storage. - -Create an end to end data pipeline and query your first table in R2 SQL by following [this step by step guide](/r2/sql/end-to-end-pipeline/), learn how to create a data pipeline that takes a stream of events and automatically creates an Apache Iceberg table, making them accessible with R2 SQL. \ No newline at end of file diff --git a/src/content/docs/r2/sql/query-data.mdx b/src/content/docs/r2/sql/query-data.mdx deleted file mode 100644 index c30e8d6c9ee1d9..00000000000000 --- a/src/content/docs/r2/sql/query-data.mdx +++ /dev/null @@ -1,78 +0,0 @@ ---- -title: Query data in R2 Data Catalog -pcx_content_type: example -sidebar: - order: 3 ---- - -:::note -R2 SQL is currently in open beta -::: - -## Prerequisites - -- Sign up for a [Cloudflare account](https://dash.cloudflare.com/sign-up/workers-and-pages). -- [Create an R2 bucket](/r2/buckets/create-buckets/) and [enable the data catalog](/r2/data-catalog/manage-catalogs/#enable-r2-data-catalog-on-a-bucket). -- [Create an R2 API token](/r2/api/tokens/) with [R2, R2 SQL, and data catalog permissions](/r2/api/tokens/#permissions). -- Tables must have a time-based partition key in order to be queried by R2 SQL. Read about the current [limitations](/r2/sql/platform/limitations-best-practices) to learn more. - -R2 SQL can currently be accessed via Wrangler commands or a REST API. - -## Wrangler - - -Export your R2 API token as an environment variable: - -```bash -export WRANGLER_R2_SQL_AUTH_TOKEN=your_token_here -``` - -If this is your first time using Wrangler, make sure to login. -```bash -npx wrangler login -``` - -You'll also want to grab the **warehouse** of the R2 Data Catalog: - -```sh -❯ npx wrangler r2 bucket catalog get [BUCKET_NAME] - - ⛅️ wrangler 4.38.0 -──────────────────────────────────────────────────────────────────────────── -▲ [WARNING] 🚧 `wrangler r2 bucket catalog get` is an open-beta command. Please report any issues to https://github.com/cloudflare/workers-sdk/issues/new/choose - - -Catalog URI: https://catalog.cloudflarestorage.com/[ACCOUNT_ID]/[BUCKET_NAME] -Warehouse: [ACCOUNT_ID]_[BUCKET_NAME] -Status: active -``` - -To query R2 SQL with Wrangler, simply run: - -```sh -npx wrangler r2 sql query "YOUR_WAREHOUSE" "SELECT * FROM namespace.table_name limit 10;" -``` -For a full list of supported sql commands, check out the [R2 SQL reference page](/r2/sql/platform/sql-reference). - - -## REST API - -Set your environment variable - -```bash -export ACCOUNT_ID="your-cloudflare-account-id" -export BUCKET_NAME="your-r2-bucket-name" -export WRANGLER_R2_SQL_AUTH_TOKEN="your_token_here" -``` - -Now you're ready to use the REST endpoint - -```bash -curl -X POST \ - "https://api.sql.cloudflarestorage.com/api/v1/accounts/${ACCOUNT_ID}/r2-sql/query/${BUCKET_NAME}" \ - -H "Authorization: Bearer ${WRANGLER_R2_SQL_AUTH_TOKEN}" \ - -H "Content-Type: application/json" \ - -d '{ - "query": "SELECT * FROM namespace.table_name limit 10;" - }' | jq . 
-``` \ No newline at end of file diff --git a/src/content/products/r2-sql.yaml b/src/content/products/r2-sql.yaml new file mode 100644 index 00000000000000..4c72d34cd28cab --- /dev/null +++ b/src/content/products/r2-sql.yaml @@ -0,0 +1,12 @@ + +name: R2 SQL + +product: + title: R2 SQL + url: /r2-sql/ + group: Developer platform + +meta: + title: R2 SQL docs + description: Cloudflare's serverless, distributed query engine for data stored in R2 Data Catalog + author: '@cloudflare' \ No newline at end of file diff --git a/src/icons/r2-sql.svg b/src/icons/r2-sql.svg new file mode 100644 index 00000000000000..3d391a2de4036a --- /dev/null +++ b/src/icons/r2-sql.svg @@ -0,0 +1 @@ + \ No newline at end of file From 5a2776806d5a0eeb06e8facf6549cde5a8b6cb2f Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Mon, 22 Sep 2025 13:27:03 -0700 Subject: [PATCH 10/30] added new R2 SQL token env variable --- .../docs/workers/wrangler/system-environment-variables.mdx | 3 +++ 1 file changed, 3 insertions(+) diff --git a/src/content/docs/workers/wrangler/system-environment-variables.mdx b/src/content/docs/workers/wrangler/system-environment-variables.mdx index d24c93dacafc7c..c8864ecc75c06c 100644 --- a/src/content/docs/workers/wrangler/system-environment-variables.mdx +++ b/src/content/docs/workers/wrangler/system-environment-variables.mdx @@ -84,6 +84,8 @@ Wrangler supports the following environment variables: - `DOCKER_HOST` - Used for local development of [Containers](/containers/local-dev). Wrangler will attempt to automatically find the correct socket to use to communicate with your container engine. If that does not work (usually surfacing as an `internal error` when attempting to connect to your Container), you can try setting the socket path using this environment variable. +* `WRANGLER_R2_SQL_AUTH_TOKEN` + - API token used for executing queries with [R2 SQL](/r2-sql). ## Example `.env` file The following is an example `.env` file: @@ -96,6 +98,7 @@ WRANGLER_SEND_METRICS=true CLOUDFLARE_API_BASE_URL=https://api.cloudflare.com/client/v4 WRANGLER_LOG=debug WRANGLER_LOG_PATH=../Desktop/my-logs/my-log-file.log +WRANGLER_R2_SQL_AUTH_TOKEN= ``` ## Deprecated global variables From dde1d628cf417fdbefa5d4b597c659b339440d79 Mon Sep 17 00:00:00 2001 From: Marc Selwan Date: Mon, 22 Sep 2025 13:56:15 -0700 Subject: [PATCH 11/30] adding wrangler commands --- src/content/docs/r2-sql/index.mdx | 2 +- src/content/docs/r2-sql/platform/index.mdx | 7 ++++++ .../{reference => platform}/pricing.mdx | 0 .../r2-sql/platform/wrangler-commands.mdx | 14 +++++++++++ .../docs/workers/wrangler/commands.mdx | 6 +++++ .../workers/wrangler-commands/r2-sql.mdx | 24 +++++++++++++++++++ 6 files changed, 52 insertions(+), 1 deletion(-) create mode 100644 src/content/docs/r2-sql/platform/index.mdx rename src/content/docs/r2-sql/{reference => platform}/pricing.mdx (100%) create mode 100644 src/content/docs/r2-sql/platform/wrangler-commands.mdx create mode 100644 src/content/partials/workers/wrangler-commands/r2-sql.mdx diff --git a/src/content/docs/r2-sql/index.mdx b/src/content/docs/r2-sql/index.mdx index 554d31c511cd99..2bb44f23e21e14 100644 --- a/src/content/docs/r2-sql/index.mdx +++ b/src/content/docs/r2-sql/index.mdx @@ -13,7 +13,7 @@ description: A distributed SQL engine for R2 Data Catalog :::note -R2 SQL is in public beta, and any developer with an R2 subscription can start using it. Currently, outside of standard R2 storage and operations, you will not be billed for your use of R2 SQL. 
We will update [the pricing page](/r2-sql/reference/pricing) and provide at least 30 days notice before enabling billing. +R2 SQL is in public beta, and any developer with an R2 subscription can start using it. Currently, outside of standard R2 storage and operations, you will not be billed for your use of R2 SQL. We will update [the pricing page](/r2-sql/platform/pricing) and provide at least 30 days notice before enabling billing. ::: R2 SQL is Cloudflare's serverless, distributed, analytics query engine for querying [Apache Iceberg](https://iceberg.apache.org/) tables stored in [R2 data catalog](https://developers.cloudflare.com/r2/data-catalog/). R2 SQL is designed to efficiently query large amounts of data by automatically utilizing file pruning, Cloudflare's distributed compute, and R2 object storage. diff --git a/src/content/docs/r2-sql/platform/index.mdx b/src/content/docs/r2-sql/platform/index.mdx new file mode 100644 index 00000000000000..ef43ff93fe3c19 --- /dev/null +++ b/src/content/docs/r2-sql/platform/index.mdx @@ -0,0 +1,7 @@ +--- +title: Platform +pcx_content_type: navigation +sidebar: + group: + hideIndex: true +--- diff --git a/src/content/docs/r2-sql/reference/pricing.mdx b/src/content/docs/r2-sql/platform/pricing.mdx similarity index 100% rename from src/content/docs/r2-sql/reference/pricing.mdx rename to src/content/docs/r2-sql/platform/pricing.mdx diff --git a/src/content/docs/r2-sql/platform/wrangler-commands.mdx b/src/content/docs/r2-sql/platform/wrangler-commands.mdx new file mode 100644 index 00000000000000..76e85fae5e3720 --- /dev/null +++ b/src/content/docs/r2-sql/platform/wrangler-commands.mdx @@ -0,0 +1,14 @@ +--- +pcx_content_type: concept +title: Wrangler commands +sidebar: + order: 80 +--- + +import { Render, Type, MetaInfo } from "~/components"; + + + +## Global commands + + \ No newline at end of file diff --git a/src/content/docs/workers/wrangler/commands.mdx b/src/content/docs/workers/wrangler/commands.mdx index 383044d7e36322..622ef7b15c76b6 100644 --- a/src/content/docs/workers/wrangler/commands.mdx +++ b/src/content/docs/workers/wrangler/commands.mdx @@ -36,6 +36,7 @@ Wrangler offers a number of commands to manage your Cloudflare Workers. - [`kv bulk`](#kv-bulk) - Manage multiple key-value pairs within a Workers KV namespace in batches. - [`r2 bucket`](#r2-bucket) - Manage Workers R2 buckets. - [`r2 object`](#r2-object) - Manage Workers R2 objects. +- [`r2 sql`](#r2-sql) - Query tables in R2 Data Catalog with R2 SQL. - [`secret`](#secret) - Manage the secret variables for a Worker. - [`secret bulk`](#secret-bulk) - Manage multiple secret variables for a Worker. - [`secrets-store secret`](#secrets-store-secret) - Manage account secrets within a secrets store. @@ -356,6 +357,11 @@ wrangler delete [