From 4180741fefec950ef4a6e492e22699227152398c Mon Sep 17 00:00:00 2001 From: Zhang Li Date: Fri, 10 May 2024 19:35:43 +0800 Subject: [PATCH] release version 2.0.9.1 (#470) Co-authored-by: zhangli20 --- .github/workflows/build-ce7-releases.yml | 2 +- Cargo.toml | 36 ++++++++++++------------ RELEASES.md | 23 ++++----------- pom.xml | 2 +- 4 files changed, 26 insertions(+), 37 deletions(-) diff --git a/.github/workflows/build-ce7-releases.yml b/.github/workflows/build-ce7-releases.yml index a9da1b43..cf8fda8f 100644 --- a/.github/workflows/build-ce7-releases.yml +++ b/.github/workflows/build-ce7-releases.yml @@ -12,7 +12,7 @@ jobs: strategy: matrix: sparkver: [spark303, spark333] - blazever: [2.0.9] + blazever: [2.0.9.1] steps: - uses: actions/checkout@v4 diff --git a/Cargo.toml b/Cargo.toml index 9ec42049..5052eab7 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -64,26 +64,26 @@ serde_json = { version = "1.0.96" } [patch.crates-io] # datafusion: branch=v36-blaze -datafusion = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "8cd557f32"} -datafusion-common = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "8cd557f32"} -datafusion-expr = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "8cd557f32"} -datafusion-execution = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "8cd557f32"} -datafusion-optimizer = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "8cd557f32"} -datafusion-physical-expr = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "8cd557f32"} +datafusion = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "71433f743b2c399ea1728531b0e56fd7c6ef5282"} +datafusion-common = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "71433f743b2c399ea1728531b0e56fd7c6ef5282"} +datafusion-expr = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "71433f743b2c399ea1728531b0e56fd7c6ef5282"} +datafusion-execution 
= { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "71433f743b2c399ea1728531b0e56fd7c6ef5282"} +datafusion-optimizer = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "71433f743b2c399ea1728531b0e56fd7c6ef5282"} +datafusion-physical-expr = { git = "https://github.com/blaze-init/arrow-datafusion.git", rev = "71433f743b2c399ea1728531b0e56fd7c6ef5282"} # arrow: branch=v50-blaze -arrow = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-arith = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-array = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-buffer = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-cast = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-data = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-ord = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-row = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-schema = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-select = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -arrow-string = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} -parquet = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "b1e0762ba4"} +arrow = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-arith = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-array = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-buffer = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-cast = { git = 
"https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-data = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-ord = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-row = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-schema = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-select = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +arrow-string = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} +parquet = { git = "https://github.com/blaze-init/arrow-rs.git", rev = "2c39d9a251f7e3f8f15312bdd0c38759e465e8bc"} # serde_json: branch=v1.0.96-blaze serde_json = { git = "https://github.com/blaze-init/json", branch = "v1.0.96-blaze" } diff --git a/RELEASES.md b/RELEASES.md index adf28f49..795eeb7d 100644 --- a/RELEASES.md +++ b/RELEASES.md @@ -1,23 +1,12 @@ -# blaze-v2.0.9 +# blaze-v2.0.9.1 ## Features -* Upgrades datafusion/arrow dependency version to v36/v50. -* Supports max/min aggregation with complex types. -* Supports json_tuple. -* Introduce sonic-rs for json parsing. -* Add stage id in operator metrics. -* Implements writing table with dynamic partitions (not tested in spark303/spark333). +* Supports failing-back nondeterministic expressions. +* Supports "$[].xxx" jsonpath syntax in get_json_object(). ## Performance -* Improves batch serialization format and reduce compressed size. -* Implements radix-based k-way merging used in shuffling and aggregating. -* Improves performance of on-heap spilling. -* Improves performance of SortExec. -* Improves performance of AggExec. -* Improves performance of collect_set/collect_list. 
+* Supports adaptive batch size in ParquetScan, improving vectorized reading performance. +* Supports spilling directly to disk files when on-heap memory is full. ## Bugfix -* Fix concat_ws with empty batches. -* Fix spark333 RenameExec incorrect ordering expressions. -* Fix incorrect join type mapping in BroadcastNestedLoopJoin. -* Fix decimal dividing with zero. +* Fix incorrect parquet rowgroup pruning with files containing deprecated min/max values. diff --git a/pom.xml b/pom.xml index bfe9041f..8598cfd2 100644 --- a/pom.xml +++ b/pom.xml @@ -13,7 +13,7 @@ - 2.0.9-SNAPSHOT + 2.0.9.1-SNAPSHOT UTF-8 15.0.2 3.21.9