Skip to content

Commit cdb5159

Browse files
authored
chore: update datafusion to 49 (#1285)
1 parent 948cab1 commit cdb5159

File tree

17 files changed

+374
-271
lines changed

17 files changed

+374
-271
lines changed

Cargo.lock

Lines changed: 314 additions & 233 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

Cargo.toml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -35,10 +35,10 @@ arrow-flight = { version = "55", features = ["flight-sql-experimental"] }
3535
clap = { version = "4.5", features = ["derive", "cargo"] }
3636
configure_me = { version = "0.4.0" }
3737
configure_me_codegen = { version = "0.4.4" }
38-
datafusion = "48.0.1"
39-
datafusion-cli = "48.0.1"
40-
datafusion-proto = "48.0.1"
41-
datafusion-proto-common = "48.0.1"
38+
datafusion = "49.0.1"
39+
datafusion-cli = "49.0.1"
40+
datafusion-proto = "49.0.1"
41+
datafusion-proto-common = "49.0.1"
4242
object_store = "0.12"
4343
prost = "0.13"
4444
prost-types = "0.13"

ballista-cli/Cargo.toml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
[package]
1919
name = "ballista-cli"
2020
description = "Command Line Client for Ballista distributed query engine."
21-
version = "48.0.0"
21+
version = "49.0.0"
2222
authors = ["Apache DataFusion <dev@datafusion.apache.org>"]
2323
edition = { workspace = true }
2424
rust-version = { workspace = true }
@@ -29,7 +29,7 @@ repository = "https://github.com/apache/datafusion-ballista"
2929
readme = "README.md"
3030

3131
[dependencies]
32-
ballista = { path = "../ballista/client", version = "48.0.0", features = ["standalone"] }
32+
ballista = { path = "../ballista/client", version = "49.0.0", features = ["standalone"] }
3333
clap = { workspace = true, features = ["derive", "cargo"] }
3434
datafusion = { workspace = true }
3535
datafusion-cli = { workspace = true }

ballista/client/Cargo.toml

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919
name = "ballista"
2020
description = "Ballista Distributed Compute"
2121
license = "Apache-2.0"
22-
version = "48.0.0"
22+
version = "49.0.0"
2323
homepage = "https://datafusion.apache.org/ballista/"
2424
repository = "https://github.com/apache/datafusion-ballista"
2525
readme = "README.md"
@@ -29,18 +29,18 @@ rust-version = { workspace = true }
2929

3030
[dependencies]
3131
async-trait = { workspace = true }
32-
ballista-core = { path = "../core", version = "48.0.0" }
33-
ballista-executor = { path = "../executor", version = "48.0.0", optional = true }
34-
ballista-scheduler = { path = "../scheduler", version = "48.0.0", optional = true }
32+
ballista-core = { path = "../core", version = "49.0.0" }
33+
ballista-executor = { path = "../executor", version = "49.0.0", optional = true }
34+
ballista-scheduler = { path = "../scheduler", version = "49.0.0", optional = true }
3535
datafusion = { workspace = true }
3636
log = { workspace = true }
3737

3838
tokio = { workspace = true }
3939
url = { workspace = true }
4040

4141
[dev-dependencies]
42-
ballista-executor = { path = "../executor", version = "48.0.0" }
43-
ballista-scheduler = { path = "../scheduler", version = "48.0.0" }
42+
ballista-executor = { path = "../executor", version = "49.0.0" }
43+
ballista-scheduler = { path = "../scheduler", version = "49.0.0" }
4444
ctor = { workspace = true }
4545
datafusion-proto = { workspace = true }
4646
env_logger = { workspace = true }

ballista/client/tests/context_checks.rs

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -498,7 +498,7 @@ mod supported {
498498
ctx: SessionContext,
499499
) -> datafusion::error::Result<()> {
500500
let result = ctx
501-
.sql("select name, value from information_schema.df_settings where name like 'datafusion.execution.parquet.schema_force_view_types' or name like 'datafusion.sql_parser.map_varchar_to_utf8view' order by name limit 2")
501+
.sql("select name, value from information_schema.df_settings where name like 'datafusion.execution.parquet.schema_force_view_types' or name like 'datafusion.sql_parser.map_string_types_to_utf8view' order by name limit 2")
502502
.await?
503503
.collect()
504504
.await?;
@@ -508,7 +508,7 @@ mod supported {
508508
"| name | value |",
509509
"+------------------------------------------------------+-------+",
510510
"| datafusion.execution.parquet.schema_force_view_types | false |",
511-
"| datafusion.sql_parser.map_varchar_to_utf8view | false |",
511+
"| datafusion.sql_parser.map_string_types_to_utf8view | false |",
512512
"+------------------------------------------------------+-------+",
513513
];
514514

ballista/core/Cargo.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,7 @@
1919
name = "ballista-core"
2020
description = "Ballista Distributed Compute"
2121
license = "Apache-2.0"
22-
version = "48.0.0"
22+
version = "49.0.0"
2323
homepage = "https://datafusion.apache.org/ballista/"
2424
repository = "https://github.com/apache/datafusion-ballista"
2525
readme = "README.md"

ballista/core/proto/datafusion.proto

Lines changed: 11 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -98,6 +98,7 @@ message ListingTableScanNode {
9898
datafusion_common.ParquetFormat parquet = 11;
9999
datafusion_common.AvroFormat avro = 12;
100100
datafusion_common.NdJsonFormat json = 15;
101+
datafusion_common.ArrowFormat arrow = 16;
101102
}
102103
repeated SortExprNodeCollection file_sort_order = 13;
103104
}
@@ -243,7 +244,7 @@ message JoinNode {
243244
datafusion_common.JoinConstraint join_constraint = 4;
244245
repeated LogicalExprNode left_join_key = 5;
245246
repeated LogicalExprNode right_join_key = 6;
246-
bool null_equals_null = 7;
247+
datafusion_common.NullEquality null_equality = 7;
247248
LogicalExprNode filter = 8;
248249
}
249250

@@ -726,6 +727,7 @@ message PhysicalPlanNode {
726727
ParquetSinkExecNode parquet_sink = 29;
727728
UnnestExecNode unnest = 30;
728729
JsonScanExecNode json_scan = 31;
730+
CooperativeExecNode cooperative = 32;
729731
}
730732
}
731733

@@ -858,6 +860,7 @@ message PhysicalScalarUdfNode {
858860
optional bytes fun_definition = 3;
859861
datafusion_common.ArrowType return_type = 4;
860862
bool nullable = 5;
863+
string return_field_name = 6;
861864
}
862865

863866
message PhysicalAggregateExprNode {
@@ -869,6 +872,7 @@ message PhysicalAggregateExprNode {
869872
bool distinct = 3;
870873
bool ignore_nulls = 6;
871874
optional bytes fun_definition = 7;
875+
string human_display = 8;
872876
}
873877

874878
message PhysicalWindowExprNode {
@@ -1033,6 +1037,10 @@ message AvroScanExecNode {
10331037
FileScanExecConf base_conf = 1;
10341038
}
10351039

1040+
message CooperativeExecNode {
1041+
PhysicalPlanNode input = 1;
1042+
}
1043+
10361044
enum PartitionMode {
10371045
COLLECT_LEFT = 0;
10381046
PARTITIONED = 1;
@@ -1045,7 +1053,7 @@ message HashJoinExecNode {
10451053
repeated JoinOn on = 3;
10461054
datafusion_common.JoinType join_type = 4;
10471055
PartitionMode partition_mode = 6;
1048-
bool null_equals_null = 7;
1056+
datafusion_common.NullEquality null_equality = 7;
10491057
JoinFilter filter = 8;
10501058
repeated uint32 projection = 9;
10511059
}
@@ -1061,7 +1069,7 @@ message SymmetricHashJoinExecNode {
10611069
repeated JoinOn on = 3;
10621070
datafusion_common.JoinType join_type = 4;
10631071
StreamPartitionMode partition_mode = 6;
1064-
bool null_equals_null = 7;
1072+
datafusion_common.NullEquality null_equality = 7;
10651073
JoinFilter filter = 8;
10661074
repeated PhysicalSortExprNode left_sort_exprs = 9;
10671075
repeated PhysicalSortExprNode right_sort_exprs = 10;

ballista/core/proto/datafusion_common.proto

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -55,6 +55,8 @@ message NdJsonFormat {
5555
JsonOptions options = 1;
5656
}
5757

58+
message ArrowFormat {}
59+
5860

5961
message PrimaryKeyConstraint{
6062
repeated uint64 indices = 1;
@@ -85,13 +87,19 @@ enum JoinType {
8587
RIGHTSEMI = 6;
8688
RIGHTANTI = 7;
8789
LEFTMARK = 8;
90+
RIGHTMARK = 9;
8891
}
8992

9093
enum JoinConstraint {
9194
ON = 0;
9295
USING = 1;
9396
}
9497

98+
enum NullEquality {
99+
NULL_EQUALS_NOTHING = 0;
100+
NULL_EQUALS_NULL = 1;
101+
}
102+
95103
message AvroOptions {}
96104
message ArrowOptions {}
97105

ballista/core/src/client.rs

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -232,7 +232,7 @@ impl Stream for FlightDataStream {
232232
self.schema.clone(),
233233
&self.dictionaries_by_id,
234234
)
235-
.map_err(|e| DataFusionError::ArrowError(e, None))
235+
.map_err(|e| DataFusionError::ArrowError(Box::new(e), None))
236236
});
237237
Some(converted_chunk)
238238
}

ballista/core/src/error.rs

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ pub enum BallistaError {
3838
General(String),
3939
Internal(String),
4040
Configuration(String),
41-
ArrowError(ArrowError),
41+
ArrowError(Box<ArrowError>),
4242
DataFusionError(Box<DataFusionError>),
4343
SqlError(parser::ParserError),
4444
IoError(io::Error),
@@ -84,7 +84,7 @@ impl From<ArrowError> for BallistaError {
8484
*e.downcast::<DataFusionError>().unwrap(),
8585
))
8686
}
87-
other => BallistaError::ArrowError(other),
87+
other => BallistaError::ArrowError(Box::new(other)),
8888
}
8989
}
9090
}
@@ -98,7 +98,7 @@ impl From<parser::ParserError> for BallistaError {
9898
impl From<DataFusionError> for BallistaError {
9999
fn from(e: DataFusionError) -> Self {
100100
match e {
101-
DataFusionError::ArrowError(e, _) => Self::from(e),
101+
DataFusionError::ArrowError(e, _) => Self::from(*e),
102102
_ => BallistaError::DataFusionError(Box::new(e)),
103103
}
104104
}

0 commit comments

Comments
 (0)