maxmind
diff --git a/CHANGELOG.md b/CHANGELOG.md
Lines changed: 5 additions & 5 deletions
diff --git a/README.md b/README.md
Lines changed: 2 additions & 2 deletions
diff --git a/docs/config.md b/docs/config.md
Lines changed: 19 additions & 8 deletions
diff --git a/internal/config/config.go b/internal/config/config.go
Lines changed: 59 additions & 29 deletions
@@ -15,17 +15,17 @@ and this project adheres to
   declaring that rows are sorted by start_int in ascending order. This enables
   query engines like DuckDB, Spark, and Trino to use the sort order for
   potential optimizations like binary search.
-- New `network_bucket` network column type for Parquet output, enabling
+- New `network_bucket` network column type for CSV and Parquet output, enabling
   efficient IP lookups in BigQuery and other analytics platforms. When a network
   spans multiple buckets, rows are duplicated with different bucket values while
   preserving original network info. For IPv4, the bucket is an integer. For
   IPv6, the bucket is either a hex string (e.g.,
   "200f0000000000000000000000000000") or an integer depending on
   `ipv6_bucket_type`. Requires split output files (`ipv4_file` and `ipv6_file`).
-- New Parquet options `ipv4_bucket_size` and `ipv6_bucket_size` to configure
-  bucket prefix lengths (default: 16).
-- New Parquet option `ipv6_bucket_type` to configure the IPv6 network bucket
-  column format (default: string).
+- New CSV and Parquet options `ipv4_bucket_size` and `ipv6_bucket_size` to
+  configure bucket prefix lengths (default: 16).
+- New CSV and Parquet option `ipv6_bucket_type` to configure the IPv6 network
+  bucket column format (default: string).
 
 ## [0.1.0] - 2025-11-07
 
 
@@ -423,7 +423,7 @@ split your output into separate IPv4/IPv6 files via `output.ipv4_file` and
 `output.ipv6_file`. For single-file outputs that include IPv6 data, use string
 columns (`start_ip`, `end_ip`, `cidr`).
 
-**Note:** `network_bucket` is currently only supported for Parquet output.
+**Note:** `network_bucket` is supported for CSV and Parquet output.
 
 ### Network Bucketing for Analytics (BigQuery, etc.)
 
@@ -466,7 +466,7 @@ For IPv4, the bucket is an integer. For IPv6, the bucket is either a hex string
 buckets), the row is duplicated for each bucket it spans. This ensures queries
 find the correct network regardless of which bucket the IP falls into.
 
-**Note:** `network_bucket` is currently only supported for Parquet output.
+**Note:** `network_bucket` is supported for CSV and Parquet output.
 
 ### Data Type Hints
 
 
@@ -72,8 +72,19 @@ When `format = "csv"`, you can specify CSV-specific options:
 [output.csv]
 delimiter = ","           # Field delimiter (default: ",")
 include_header = true     # Include column headers (default: true)
+ipv4_bucket_size = 16     # Bucket prefix length for IPv4 (default: 16)
+ipv6_bucket_size = 16     # Bucket prefix length for IPv6 (default: 16)
+ipv6_bucket_type = "string"  # IPv6 bucket value type: "string" or "int" (default: "string")
 ```
 
+| Option             | Description                                                                | Default  |
+| ------------------ | -------------------------------------------------------------------------- | -------- |
+| `delimiter`        | Field delimiter character                                                  | ","      |
+| `include_header`   | Include column headers in output                                           | true     |
+| `ipv4_bucket_size` | Prefix length for IPv4 buckets (1-32, when `network_bucket` column used)   | 16       |
+| `ipv6_bucket_size` | Prefix length for IPv6 buckets (1-60, when `network_bucket` column used)   | 16       |
+| `ipv6_bucket_type` | IPv6 bucket value type: "string" (hex) or "int" (first 60 bits as integer) | "string" |
+
 #### Parquet Options
 
 When `format = "parquet"`, you can specify Parquet-specific options:
@@ -146,14 +157,14 @@ type = "cidr"       # Output type
 
 **Available types:**
 
-| Type             | Description                                                                                                                                                |
-| ---------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `cidr`           | CIDR notation (e.g., "203.0.113.0/24")                                                                                                                     |
-| `start_ip`       | Starting IP address (e.g., "203.0.113.0")                                                                                                                  |
-| `end_ip`         | Ending IP address (e.g., "203.0.113.255")                                                                                                                  |
-| `start_int`      | Starting IP as integer                                                                                                                                     |
-| `end_int`        | Ending IP as integer                                                                                                                                       |
-| `network_bucket` | Bucket for efficient lookups. IPv4: integer. IPv6: hex string (default) or integer (with `ipv6_bucket_type = "int"`). Requires split files (Parquet only). |
+| Type             | Description                                                                                                                                                        |
+| ---------------- | ------------------------------------------------------------------------------------------------------------------------------------------------------------------ |
+| `cidr`           | CIDR notation (e.g., "203.0.113.0/24")                                                                                                                             |
+| `start_ip`       | Starting IP address (e.g., "203.0.113.0")                                                                                                                          |
+| `end_ip`         | Ending IP address (e.g., "203.0.113.255")                                                                                                                          |
+| `start_int`      | Starting IP as integer                                                                                                                                             |
+| `end_int`        | Ending IP as integer                                                                                                                                               |
+| `network_bucket` | Bucket for efficient lookups. IPv4: integer. IPv6: hex string (default) or integer (with `ipv6_bucket_type = "int"`). Requires split files (CSV and Parquet only). |
 
 **Default behavior:** If no `[[network.columns]]` sections are defined:
 
 
@@ -46,8 +46,11 @@ type OutputConfig struct {
 
 // CSVConfig defines CSV output options.
 type CSVConfig struct {
-	Delimiter     string `toml:"delimiter"`      // Field delimiter (default: ",")
-	IncludeHeader *bool  `toml:"include_header"` // Include column headers (default: true)
+	Delimiter      string `toml:"delimiter"`        // Field delimiter (default: ",")
+	IncludeHeader  *bool  `toml:"include_header"`   // Include column headers (default: true)
+	IPv4BucketSize int    `toml:"ipv4_bucket_size"` // Bucket prefix length for IPv4 (default: 16)
+	IPv6BucketSize int    `toml:"ipv6_bucket_size"` // Bucket prefix length for IPv6 (default: 16)
+	IPv6BucketType string `toml:"ipv6_bucket_type"` // "string" or "int" (default: "string")
 }
 
 // ParquetConfig defines Parquet output options.
@@ -174,6 +177,15 @@ func applyDefaults(config *Config) {
 	if config.Output.CSV.IncludeHeader == nil {
 		config.Output.CSV.IncludeHeader = boolPtr(true)
 	}
+	if config.Output.CSV.IPv4BucketSize == 0 {
+		config.Output.CSV.IPv4BucketSize = 16
+	}
+	if config.Output.CSV.IPv6BucketSize == 0 {
+		config.Output.CSV.IPv6BucketSize = 16
+	}
+	if config.Output.CSV.IPv6BucketType == "" {
+		config.Output.CSV.IPv6BucketType = IPv6BucketTypeString
+	}
 
 	// Parquet defaults
 	if config.Output.Parquet.Compression == "" {
@@ -360,9 +372,9 @@ func validate(config *Config) error {
 	}
 
 	if hasBucketColumn {
-		if config.Output.Format != formatParquet {
+		if config.Output.Format == formatMMDB {
 			return errors.New(
-				"network_bucket column type is only supported for Parquet output",
+				"network_bucket column type is only supported for CSV and Parquet output",
 			)
 		}
 
@@ -374,31 +386,8 @@ func validate(config *Config) error {
 			)
 		}
 
-		// Validate bucket sizes when network_bucket column is used
-		if config.Output.Parquet.IPv4BucketSize < 1 ||
-			config.Output.Parquet.IPv4BucketSize > 32 {
-			return fmt.Errorf(
-				"ipv4_bucket_size must be between 1 and 32, got %d",
-				config.Output.Parquet.IPv4BucketSize,
-			)
-		}
-		// IPv6 bucket size capped at 60 to support int type (60-bit values fit in
-		// positive int64, simplifying BigQuery queries)
-		if config.Output.Parquet.IPv6BucketSize < 1 ||
-			config.Output.Parquet.IPv6BucketSize > 60 {
-			return fmt.Errorf(
-				"ipv6_bucket_size must be between 1 and 60, got %d",
-				config.Output.Parquet.IPv6BucketSize,
-			)
-		}
-
-		// Validate IPv6 bucket type
-		if config.Output.Parquet.IPv6BucketType != IPv6BucketTypeString &&
-			config.Output.Parquet.IPv6BucketType != IPv6BucketTypeInt {
-			return fmt.Errorf(
-				"ipv6_bucket_type must be 'string' or 'int', got '%s'",
-				config.Output.Parquet.IPv6BucketType,
-			)
+		if err := validateBucketConfig(config); err != nil {
+			return err
 		}
 	}
 
@@ -451,3 +440,44 @@ func validate(config *Config) error {
 
 	return nil
 }
+
+// validateBucketConfig checks the CSV bucket options for CSV output, Parquet's otherwise.
+func validateBucketConfig(config *Config) error {
+	var ipv4BucketSize, ipv6BucketSize int
+	var ipv6BucketType string
+
+	if config.Output.Format == formatCSV {
+		ipv4BucketSize = config.Output.CSV.IPv4BucketSize
+		ipv6BucketSize = config.Output.CSV.IPv6BucketSize
+		ipv6BucketType = config.Output.CSV.IPv6BucketType
+	} else {
+		ipv4BucketSize = config.Output.Parquet.IPv4BucketSize
+		ipv6BucketSize = config.Output.Parquet.IPv6BucketSize
+		ipv6BucketType = config.Output.Parquet.IPv6BucketType
+	}
+
+	if ipv4BucketSize < 1 || ipv4BucketSize > 32 {
+		return fmt.Errorf(
+			"ipv4_bucket_size must be between 1 and 32, got %d",
+			ipv4BucketSize,
+		)
+	}
+
+	// IPv6 bucket size capped at 60 to support int type (60-bit values fit in
+	// positive int64, simplifying BigQuery queries)
+	if ipv6BucketSize < 1 || ipv6BucketSize > 60 {
+		return fmt.Errorf(
+			"ipv6_bucket_size must be between 1 and 60, got %d",
+			ipv6BucketSize,
+		)
+	}
+
+	if ipv6BucketType != IPv6BucketTypeString && ipv6BucketType != IPv6BucketTypeInt {
+		return fmt.Errorf(
+			"ipv6_bucket_type must be 'string' or 'int', got '%s'",
+			ipv6BucketType,
+		)
+	}
+
+	return nil
+}