From 152be37c1669ef4b98e63e42b9653e23499ce633 Mon Sep 17 00:00:00 2001
From: Zhen Wang <643348094@qq.com>
Date: Mon, 9 Dec 2024 14:08:34 +0800
Subject: [PATCH] [CORE][UNIFFLE] Bump uniffle 0.9.1 (#8166)
* Bump uniffle 0.9.1
* address comment
* address comment
---
.github/workflows/velox_backend.yml | 23 ++++++++++-------------
docs/get-started/Velox.md | 2 +-
pom.xml | 2 +-
tools/gluten-it/pom.xml | 2 +-
4 files changed, 13 insertions(+), 16 deletions(-)
diff --git a/.github/workflows/velox_backend.yml b/.github/workflows/velox_backend.yml
index ce195c4e1b52..5feb5fa56855 100644
--- a/.github/workflows/velox_backend.yml
+++ b/.github/workflows/velox_backend.yml
@@ -491,6 +491,8 @@ jobs:
fail-fast: false
matrix:
spark: [ "spark-3.2" ]
+ uniffle: [ "0.9.1" ]
+ hadoop: [ "2.8.5" ]
runs-on: ubuntu-20.04
container: centos:8
steps:
@@ -513,21 +515,16 @@ jobs:
run: |
yum update -y && yum install -y java-1.8.0-openjdk-devel wget git
$SETUP install_maven
- - name: Build for Uniffle 0.9.0
+ - name: Install Uniffle ${{ matrix.uniffle }}
run: |
export JAVA_HOME=/usr/lib/jvm/java-1.8.0-openjdk && \
cd /opt && \
- git clone -b v0.9.0 https://github.com/apache/incubator-uniffle.git && \
- cd incubator-uniffle && \
- $MVN_CMD clean install -Phadoop2.8,spark3 -DskipTests
- cd /opt && \
- ${WGET_CMD} https://archive.apache.org/dist/incubator/uniffle/0.9.0/apache-uniffle-0.9.0-incubating-bin.tar.gz && \
- tar xzf apache-uniffle-0.9.0-incubating-bin.tar.gz -C /opt/ && mv /opt/rss-0.9.0-hadoop2.8 /opt/uniffle && \
- ${WGET_CMD} https://archive.apache.org/dist/hadoop/common/hadoop-2.8.5/hadoop-2.8.5.tar.gz && \
- tar xzf hadoop-2.8.5.tar.gz -C /opt/
- rm -rf /opt/incubator-uniffle
+ ${WGET_CMD} https://archive.apache.org/dist/incubator/uniffle/${{ matrix.uniffle }}/apache-uniffle-${{ matrix.uniffle }}-incubating-bin.tar.gz && \
+ mkdir /opt/uniffle && tar xzf apache-uniffle-${{ matrix.uniffle }}-incubating-bin.tar.gz -C /opt/uniffle --strip-components=1 && \
+ ${WGET_CMD} https://archive.apache.org/dist/hadoop/common/hadoop-${{ matrix.hadoop }}/hadoop-${{ matrix.hadoop }}.tar.gz && \
+ tar xzf hadoop-${{ matrix.hadoop }}.tar.gz -C /opt/ && \
cd /opt/uniffle && mkdir shuffle_data && \
- bash -c "echo -e 'XMX_SIZE=16g\nHADOOP_HOME=/opt/hadoop-2.8.5' > ./bin/rss-env.sh" && \
+ bash -c "echo -e 'XMX_SIZE=16g\nHADOOP_HOME=/opt/hadoop-${{ matrix.hadoop }}' > ./bin/rss-env.sh" && \
bash -c "echo -e 'rss.coordinator.shuffle.nodes.max 1\nrss.rpc.server.port 19999' > ./conf/coordinator.conf" && \
bash -c "echo -e 'rss.server.app.expired.withoutHeartbeat 7200000\nrss.server.heartbeat.delay 3000\nrss.rpc.server.port 19997\nrss.rpc.server.type GRPC_NETTY\nrss.jetty.http.port 19996\nrss.server.netty.port 19995\nrss.storage.basePath /opt/uniffle/shuffle_data\nrss.storage.type MEMORY_LOCALFILE\nrss.coordinator.quorum localhost:19999\nrss.server.flush.thread.alive 10\nrss.server.single.buffer.flush.threshold 64m' > ./conf/server.conf" && \
bash ./bin/start-coordinator.sh && bash ./bin/start-shuffle-server.sh
@@ -535,11 +532,11 @@ jobs:
run: |
cd $GITHUB_WORKSPACE/ && \
$MVN_CMD clean install -P${{ matrix.spark }} -Pbackends-velox -Puniffle -DskipTests
- - name: TPC-H SF1.0 && TPC-DS SF1.0 Parquet local spark3.2 with uniffle-0.9.0
+ - name: TPC-H SF1.0 && TPC-DS SF1.0 Parquet local spark3.2 with uniffle-${{ matrix.uniffle }}
run: |
export JAVA_HOME=/usr/lib/jvm/java-1.8.0-openjdk && \
cd $GITHUB_WORKSPACE/tools/gluten-it && \
- $MVN_CMD clean install -Pspark-3.2 -Puniffle && \
+ $MVN_CMD clean install -P${{ matrix.spark }} -Puniffle && \
GLUTEN_IT_JVM_ARGS=-Xmx5G sbin/gluten-it.sh queries-compare \
--local --preset=velox-with-uniffle --benchmark-type=h --error-on-memleak --off-heap-size=10g -s=1.0 --threads=16 --iterations=1
diff --git a/docs/get-started/Velox.md b/docs/get-started/Velox.md
index 3b3ab07a8dea..a0af0cc75d02 100644
--- a/docs/get-started/Velox.md
+++ b/docs/get-started/Velox.md
@@ -272,7 +272,7 @@ spark.dynamicAllocation.enabled false
## Uniffle support
-Uniffle with velox backend supports [Uniffle](https://github.com/apache/incubator-uniffle) as remote shuffle service. Currently, the supported Uniffle versions are `0.9.0`.
+Gluten with velox backend supports [Uniffle](https://github.com/apache/incubator-uniffle) as remote shuffle service. Currently, the only supported Uniffle version is `0.9.1`.
First refer to this URL(https://uniffle.apache.org/docs/intro) to get start with uniffle.
diff --git a/pom.xml b/pom.xml
index a2cccda1e45e..9b27a6839712 100644
--- a/pom.xml
+++ b/pom.xml
@@ -66,7 +66,7 @@
2.4.0
24
0.5.2
- 0.9.0
+ 0.9.1
15.0.0
15.0.0-gluten
arrow-memory-unsafe
diff --git a/tools/gluten-it/pom.xml b/tools/gluten-it/pom.xml
index 1973a7d99890..eb2c3d87e761 100644
--- a/tools/gluten-it/pom.xml
+++ b/tools/gluten-it/pom.xml
@@ -22,7 +22,7 @@
2.12
3
0.3.2-incubating
- 0.9.0
+ 0.9.1
1.3.0-SNAPSHOT
32.0.1-jre
1.1