diff --git a/.github/workflows/build-ce7-releases.yml b/.github/workflows/build-ce7-releases.yml index d84825e0..3763a313 100644 --- a/.github/workflows/build-ce7-releases.yml +++ b/.github/workflows/build-ce7-releases.yml @@ -12,7 +12,7 @@ jobs: strategy: matrix: sparkver: [spark-3.0, spark-3.1, spark-3.2, spark-3.3, spark-3.4, spark-3.5] - blazever: [3.0.1] + blazever: [4.0.0] steps: - uses: actions/checkout@v4 diff --git a/RELEASES.md b/RELEASES.md index 4ed7b0a5..32725386 100644 --- a/RELEASES.md +++ b/RELEASES.md @@ -1,10 +1,18 @@ -# blaze-v3.0.1 +# blaze-v4.0.0 -## Features -* Supports spark3.0/3.2/3.3. +## New features +* supports spark3.0/3.1/3.2/3.3/3.4/3.5. +* supports integrating with Apache Celeborn. +* supports native ORC input format. +* supports bloom filter join introduced in spark 3.5. +* supports forceShuffledHashJoin for running tpch/tpcds benchmarks. +* newly supported native expressions/functions: year, month, day, md5. -## Performance -fix GetJsonObject conversion, supporting faster get_json_object with sonic-rs. +## Bug fixes +* add missing UDTF.terminate() invocations. +* fix NPE while executing some native spark physical plans. -## Bugfix -* fix childOrderingRequiredTag computation logic. +## Performance +* use a custom hash table implementation for faster joins, supporting SIMD, bulk searching, memory prefetching, etc. +* improve shuffle write performance. +* reuse FSDataInputStream for the same input file. diff --git a/pom.xml b/pom.xml index 0f2f7619..42868d1e 100644 --- a/pom.xml +++ b/pom.xml @@ -14,7 +14,7 @@ - 3.0.1-SNAPSHOT + 4.0.0-SNAPSHOT UTF-8 16.0.0 3.21.9