diff --git a/.github/workflows/master.yml b/.github/workflows/master.yml index 4b871d637..60afcf6fd 100644 --- a/.github/workflows/master.yml +++ b/.github/workflows/master.yml @@ -17,10 +17,10 @@ jobs: strategy: matrix: profiles: - - '-Pspark-3.0 -Phadoop-2.7' - - '-Pspark-3.0 -Phadoop-2.7 -Dspark.archive.mirror=https://archive.apache.org/dist/spark/spark-3.1.1 -Dspark.archive.name=spark-3.1.1-bin-hadoop2.7.tgz -Dmaven.plugin.scalatest.exclude.tags=org.apache.kyuubi.tags.DataLakeTest' - - '-Pspark-3.1 -Phadoop-2.7' - - '-Pspark-3.1 -Phadoop-3.2' + - '-Pspark-3.0 -Pspark-hadoop-2.7' + - '-Pspark-3.0 -Pspark-hadoop-2.7 -Dspark.archive.mirror=https://archive.apache.org/dist/spark/spark-3.1.1 -Dspark.archive.name=spark-3.1.1-bin-hadoop2.7.tgz -Dmaven.plugin.scalatest.exclude.tags=org.apache.kyuubi.tags.DataLakeTest' + - '-Pspark-3.1 -Pspark-hadoop-2.7' + - '-Pspark-3.1 -Pspark-hadoop-3.2' steps: - uses: actions/checkout@v2 - name: Setup JDK 1.8 diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 4378f564e..6524c6a7f 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -12,12 +12,12 @@ jobs: strategy: matrix: profiles: - - '-Pspark-3.0 -Phadoop-2.7' - - '--spark-provided -Pspark-3.0 -Phadoop-2.7' - - '-Pspark-3.1 -Phadoop-2.7' - - '--spark-provided -Pspark-3.1 -Phadoop-2.7' - - '-Pspark-3.1 -Phadoop-3.2' - - '--spark-provided -Pspark-3.1 -Phadoop-3.2' + - '-Pspark-3.0 -Pspark-hadoop-2.7' + - '--spark-provided -Pspark-3.0 -Pspark-hadoop-2.7' + - '-Pspark-3.1 -Pspark-hadoop-2.7' + - '--spark-provided -Pspark-3.1 -Pspark-hadoop-2.7' + - '-Pspark-3.1 -Pspark-hadoop-3.2' + - '--spark-provided -Pspark-3.1 -Pspark-hadoop-3.2' steps: - uses: actions/checkout@master # We split caches because GitHub Action Cache has a 400MB-size limit. diff --git a/.travis.yml b/.travis.yml index adde60221..fd18314e5 100644 --- a/.travis.yml +++ b/.travis.yml @@ -28,21 +28,21 @@ cache: matrix: include: - - name: Test Kyuubi w/ -Pspark-3.0 -Phadoop-2.7 + - name: Test Kyuubi w/ -Pspark-3.0 -Pspark-hadoop-2.7 env: - - PROFILE="-Pspark-3.0 -Phadoop-2.7" + - PROFILE="-Pspark-3.0 -Pspark-hadoop-2.7" - EXCLUDE_TAGS="" - - name: Test Kyuubi w/ -Pspark-3.1 -Phadoop-2.7 + - name: Test Kyuubi w/ -Pspark-3.1 -Pspark-hadoop-2.7 env: - - PROFILE="-Pspark-3.1 -Phadoop-2.7" + - PROFILE="-Pspark-3.1 -Pspark-hadoop-2.7" - EXCLUDE_TAGS="org.apache.kyuubi.tags.DataLakeTest" - - name: Test Kyuubi w/ -Pspark-3.1 -Phadoop-3.2 + - name: Test Kyuubi w/ -Pspark-3.1 -Pspark-hadoop-3.2 env: - - PROFILE="-Pspark-3.1 -Phadoop-3.2" + - PROFILE="-Pspark-3.1 -Pspark-hadoop-3.2" - EXCLUDE_TAGS="org.apache.kyuubi.tags.DataLakeTest" - - name: Test Kyuubi w/ -Pspark-3.0 -Phadoop-2.7 by Spark 3.1 distribution + - name: Test Kyuubi w/ -Pspark-3.0 -Pspark-hadoop-2.7 by Spark 3.1 distribution env: - - PROFILE="-Pspark-3.0 -Phadoop-2.7 -Dspark.archive.mirror=https://archive.apache.org/dist/spark/spark-3.1.1 -Dspark.archive.name=spark-3.1.1-bin-hadoop2.7.tgz" + - PROFILE="-Pspark-3.0 -Pspark-hadoop-2.7 -Dspark.archive.mirror=https://archive.apache.org/dist/spark/spark-3.1.1 -Dspark.archive.name=spark-3.1.1-bin-hadoop2.7.tgz" - EXCLUDE_TAGS="org.apache.kyuubi.tags.DataLakeTest" install: diff --git a/build/dist b/build/dist index 3379d8b93..5eba94e09 100755 --- a/build/dist +++ b/build/dist @@ -128,6 +128,11 @@ SPARK_VERSION=$("$MVN" help:evaluate -Dexpression=spark.version $@ 2>/dev/null\ | grep -v "WARNING"\ | tail -n 1) +SPARK_HADOOP_VERSION=$("$MVN" help:evaluate -Dexpression=spark.hadoop.binary.version $@ 2>/dev/null\ + | grep -v "INFO"\ + | grep -v "WARNING"\ + | tail -n 1) + HADOOP_VERSION=$("$MVN" help:evaluate -Dexpression=hadoop.version $@ 2>/dev/null\ | grep -v "INFO"\ | grep -v "WARNING"\ @@ -141,17 +146,12 @@ HIVE_VERSION=$("$MVN" help:evaluate -Dexpression=hive.version $@ 2>/dev/null\ echo "Building Kyuubi package of version $VERSION against Spark version - $SPARK_VERSION" if [[ "$NAME" == "none" ]]; then - - if [[ ${HADOOP_VERSION:0:3} == "2.7" ]]; then - HADOOP_VERSION_SUFFIX="" - else - HADOOP_VERSION_SUFFIX="-hadoop${HADOOP_VERSION:0:3}" - fi + SPARK_HADOOP_VERSION_SUFFIX="-hadoop${SPARK_HADOOP_VERSION}" if [[ "$SPARK_PROVIDED" == "true" ]]; then - NAME="without-spark"$HADOOP_VERSION_SUFFIX + NAME="without-spark"$SPARK_HADOOP_VERSION_SUFFIX else - NAME="spark-"${SPARK_VERSION:0:3}$HADOOP_VERSION_SUFFIX + NAME="spark-"${SPARK_VERSION:0:3}$SPARK_HADOOP_VERSION_SUFFIX fi fi @@ -192,8 +192,8 @@ cp -r "$KYUUBI_HOME/kyuubi-assembly/target/scala-$SCALA_VERSION/jars/" "$DISTDIR ## cp engines if [[ "$SPARK_PROVIDED" != "true" ]]; then - cp -r "$KYUUBI_HOME/externals/kyuubi-download/target/spark-$SPARK_VERSION-bin-hadoop${HADOOP_VERSION:0:3}$HIVE_VERSION_SUFFIX/" \ - "$DISTDIR/externals/spark-$SPARK_VERSION-bin-hadoop${HADOOP_VERSION:0:3}$HIVE_VERSION_SUFFIX/" + cp -r "$KYUUBI_HOME/externals/kyuubi-download/target/spark-$SPARK_VERSION-bin-hadoop${SPARK_HADOOP_VERSION}$HIVE_VERSION_SUFFIX/" \ + "$DISTDIR/externals/spark-$SPARK_VERSION-bin-hadoop${SPARK_HADOOP_VERSION}$HIVE_VERSION_SUFFIX/" fi cp "$KYUUBI_HOME/externals/kyuubi-spark-sql-engine/target/kyuubi-spark-sql-engine-$VERSION.jar" "$DISTDIR/externals/engines/spark" diff --git a/externals/kyuubi-spark-sql-engine/pom.xml b/externals/kyuubi-spark-sql-engine/pom.xml index d2c7ad549..eaab1a315 100644 --- a/externals/kyuubi-spark-sql-engine/pom.xml +++ b/externals/kyuubi-spark-sql-engine/pom.xml @@ -64,6 +64,12 @@ test + + commons-collections + commons-collections + test + + org.apache.spark spark-hive_${scala.binary.version} @@ -106,7 +112,13 @@ org.apache.hadoop - hadoop-client + hadoop-client-api + test + + + + org.apache.hadoop + hadoop-client-runtime test diff --git a/kyuubi-assembly/pom.xml b/kyuubi-assembly/pom.xml index 5482e7853..ce1f22cc9 100644 --- a/kyuubi-assembly/pom.xml +++ b/kyuubi-assembly/pom.xml @@ -53,7 +53,12 @@ org.apache.hadoop - hadoop-common + hadoop-client-api + + + + org.apache.hadoop + hadoop-client-runtime diff --git a/kyuubi-common/pom.xml b/kyuubi-common/pom.xml index 2c452731d..3de378e9e 100644 --- a/kyuubi-common/pom.xml +++ b/kyuubi-common/pom.xml @@ -56,7 +56,17 @@ org.apache.hadoop - hadoop-common + hadoop-client-api + + + + org.apache.hadoop + hadoop-client-runtime + + + + commons-codec + commons-codec diff --git a/kyuubi-ha/pom.xml b/kyuubi-ha/pom.xml index 2143b957d..198481fc2 100644 --- a/kyuubi-ha/pom.xml +++ b/kyuubi-ha/pom.xml @@ -40,7 +40,13 @@ org.apache.hadoop - hadoop-common + hadoop-client-api + provided + + + + org.apache.hadoop + hadoop-client-runtime provided diff --git a/kyuubi-main/pom.xml b/kyuubi-main/pom.xml index cafb4bc6b..681c03e45 100644 --- a/kyuubi-main/pom.xml +++ b/kyuubi-main/pom.xml @@ -45,7 +45,12 @@ org.apache.hadoop - hadoop-common + hadoop-client-api + + + + org.apache.hadoop + hadoop-client-runtime diff --git a/pom.xml b/pom.xml index d116f739f..9e89b92a4 100644 --- a/pom.xml +++ b/pom.xml @@ -60,16 +60,18 @@ 2.12 2.0.0-M15 + 1.15 + 3.2.2 3.10 4.5.6 4.4.12 24.1.1-jre 2.12.0 - 2.7.4 - 2.7 + 3.2.2 2.3.7 3.0.2 - spark-${spark.version}-bin-hadoop${hadoop.binary.version}.tgz + 3.2 + spark-${spark.version}-bin-hadoop${spark.hadoop.binary.version}.tgz https://archive.apache.org/dist/spark/spark-${spark.version} false @@ -301,7 +303,13 @@ org.apache.hadoop - hadoop-client + hadoop-client-api + ${hadoop.version} + + + + org.apache.hadoop + hadoop-client-runtime ${hadoop.version} @@ -318,6 +326,18 @@ + + commons-codec + commons-codec + ${commons-codec.version} + + + + commons-collections + commons-collections + ${commons-collections.version} + + org.apache.commons commons-lang3 @@ -1367,14 +1387,16 @@ - hadoop-2.7 + spark-hadoop-2.7 + + 2.7 + - hadoop-3.2 + spark-hadoop-3.2 - 3.2.2 - 3.2 + 3.2