[KYUUBI #2024] Hive Backend Engine - ProcBuilder for HiveEngine
### _Why are the changes needed?_ Add ProcBuilder for HiveEngine. ### _How was this patch tested?_ - [ ] Add some test cases that check the changes thoroughly including negative and positive cases if possible - [ ] Add screenshots for manual tests if appropriate - [ ] [Run test](https://kyuubi.apache.org/docs/latest/develop_tools/testing.html#running-tests) locally before making a pull request Closes #2146 from zhaomin1423/hive_process_builder. Closes #2024 1baf1397 [Min Zhao] [KYUUBI #2024] Hive Backend Engine - ProcBuilder for HiveEngine 23fdc3b7 [Min Zhao] [KYUUBI #2024] Hive Backend Engine - ProcBuilder for HiveEngine Authored-by: Min Zhao <zhaomin1423@163.com> Signed-off-by: Kent Yao <yao@apache.org>
This commit is contained in:
parent
f22a14f1e5
commit
2911ac26c7
@ -81,6 +81,7 @@ fi
|
||||
export FLINK_HOME="${FLINK_HOME:-"${FLINK_BUILTIN}"}"
|
||||
export FLINK_ENGINE_HOME="${KYUUBI_HOME}/externals/engines/flink"
|
||||
export TRINO_ENGINE_HOME="${KYUUBI_HOME}/externals/engines/trino"
|
||||
export HIVE_ENGINE_HOME="${KYUUBI_HOME}/externals/engines/hive"
|
||||
export SPARK_HOME="${SPARK_HOME:-"${SPARK_BUILTIN}"}"
|
||||
|
||||
# Print essential environment variables to console
|
||||
@ -101,6 +102,8 @@ if [ $silent -eq 0 ]; then
|
||||
|
||||
echo "TRINO_ENGINE_HOME: ${TRINO_ENGINE_HOME}"
|
||||
|
||||
echo "HIVE_ENGINE_HOME: ${HIVE_ENGINE_HOME}"
|
||||
|
||||
echo "HADOOP_CONF_DIR: ${HADOOP_CONF_DIR}"
|
||||
|
||||
echo "YARN_CONF_DIR: ${YARN_CONF_DIR}"
|
||||
|
||||
@ -324,6 +324,7 @@ Key | Default | Meaning | Type | Since
|
||||
<code>kyuubi.session.engine.check.interval</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'>PT1M</div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>The check interval for engine timeout</div>|<div style='width: 30pt'>duration</div>|<div style='width: 20pt'>1.0.0</div>
|
||||
<code>kyuubi.session.engine.flink.main.resource</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'><undefined></div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>The package used to create Flink SQL engine remote job. If it is undefined, Kyuubi will use the default</div>|<div style='width: 30pt'>string</div>|<div style='width: 20pt'>1.4.0</div>
|
||||
<code>kyuubi.session.engine.flink.max.rows</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'>1000000</div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>Max rows of Flink query results. For batch queries, rows that exceeds the limit would be ignored. For streaming queries, the query would be canceled if the limit is reached.</div>|<div style='width: 30pt'>int</div>|<div style='width: 20pt'>1.5.0</div>
|
||||
<code>kyuubi.session.engine.hive.main.resource</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'><undefined></div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>The package used to create Hive engine remote job. If it is undefined, Kyuubi will use the default</div>|<div style='width: 30pt'>string</div>|<div style='width: 20pt'>1.6.0</div>
|
||||
<code>kyuubi.session.engine.idle.timeout</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'>PT30M</div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>engine timeout, the engine will self-terminate when it's not accessed for this duration. 0 or negative means not to self-terminate.</div>|<div style='width: 30pt'>duration</div>|<div style='width: 20pt'>1.0.0</div>
|
||||
<code>kyuubi.session.engine.initialize.timeout</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'>PT3M</div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>Timeout for starting the background engine, e.g. SparkSQLEngine.</div>|<div style='width: 30pt'>duration</div>|<div style='width: 20pt'>1.0.0</div>
|
||||
<code>kyuubi.session.engine.launch.async</code>|<div style='width: 65pt;word-wrap: break-word;white-space: normal'>true</div>|<div style='width: 170pt;word-wrap: break-word;white-space: normal'>When opening kyuubi session, whether to launch backend engine asynchronously. When true, the Kyuubi server will set up the connection with the client without delay as the backend engine will be created asynchronously.</div>|<div style='width: 30pt'>boolean</div>|<div style='width: 20pt'>1.4.0</div>
|
||||
|
||||
46
externals/kyuubi-hive-sql-engine/bin/hive-sql-engine.sh
vendored
Executable file
46
externals/kyuubi-hive-sql-engine/bin/hive-sql-engine.sh
vendored
Executable file
@ -0,0 +1,46 @@
|
||||
#!/usr/bin/env bash
|
||||
#
|
||||
# Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
# contributor license agreements. See the NOTICE file distributed with
|
||||
# this work for additional information regarding copyright ownership.
|
||||
# The ASF licenses this file to You under the Apache License, Version 2.0
|
||||
# (the "License"); you may not use this file except in compliance with
|
||||
# the License. You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
#
|
||||
# Launcher for the Kyuubi Hive SQL engine.
#
# Inputs (environment variables read by this script):
#   JAVA_HOME                 - required; its bin/java is used to run the engine
#   KYUUBI_HOME               - used to recognise the production layout
#   HIVE_ENGINE_HOME          - engine home; production layout or a source module
#   HIVE_ENGINE_JAR           - engine jar, used as-is in the production layout
#   HIVE_ENGINE_DYNAMIC_ARGS  - extra JVM arguments, space separated
#   HADOOP_CONF_DIR, HIVE_CONF_DIR, YARN_CONF_DIR - appended to the classpath
#
# Any arguments passed to this script are forwarded to the engine main class.

# Nothing can be launched without a JVM.
if [[ -z ${JAVA_HOME} ]]; then
  echo "[ERROR] JAVA_HOME IS NOT SET! CANNOT PROCEED."
  exit 1
fi

RUNNER="${JAVA_HOME}/bin/java"

if [[ "$HIVE_ENGINE_HOME" == "$KYUUBI_HOME/externals/engines/hive" ]]; then
  # Production layout: the jar path is handed over through HIVE_ENGINE_JAR.
  HIVE_CLIENT_JAR="$HIVE_ENGINE_JAR"
  HIVE_CLIENT_JARS_DIR="$HIVE_ENGINE_HOME/jars"
else
  # bash's echo does not interpret "\n" without -e, so emit the blank line explicitly
  # instead of printing a literal backslash-n in front of the message.
  echo ""
  echo "HIVE_ENGINE_HOME $HIVE_ENGINE_HOME doesn't match production directory, assuming in development environment..."
  # Quote the search root so a path containing spaces is not word-split, and escape
  # the dot so only real ".jar" suffixes match. Auxiliary artifacts are filtered out.
  HIVE_CLIENT_JAR=$(find "$HIVE_ENGINE_HOME/target" -regex '.*/kyuubi-hive-sql-engine_.*\.jar$' | grep -v '\-sources.jar$' | grep -v '\-javadoc.jar$' | grep -v '\-tests.jar$')
  HIVE_CLIENT_JARS_DIR=$(find "$HIVE_ENGINE_HOME/target" -regex '.*/jars')
fi

# The trailing "/*" is a JVM classpath wildcard; it must reach java unexpanded.
HIVE_CLIENT_CLASSPATH="$HIVE_CLIENT_JARS_DIR/*"
if [[ -z ${YARN_CONF_DIR} ]]; then
  FULL_CLASSPATH="$HIVE_CLIENT_CLASSPATH:$HIVE_CLIENT_JAR:$HADOOP_CONF_DIR:$HIVE_CONF_DIR"
else
  FULL_CLASSPATH="$HIVE_CLIENT_CLASSPATH:$HIVE_CLIENT_JAR:$HADOOP_CONF_DIR:$HIVE_CONF_DIR:$YARN_CONF_DIR"
fi

if [ -n "$HIVE_CLIENT_JAR" ]; then
  # RUNNER and FULL_CLASSPATH are quoted to prevent word splitting and shell globbing
  # of the "*" wildcard. HIVE_ENGINE_DYNAMIC_ARGS is intentionally left unquoted so
  # that it splits into one JVM argument per space-separated token.
  exec "$RUNNER" ${HIVE_ENGINE_DYNAMIC_ARGS} -cp "${FULL_CLASSPATH}" org.apache.kyuubi.engine.hive.HiveSQLEngine "$@"
else
  (>&2 echo "[ERROR] HIVE Engine JAR file 'kyuubi-hive-sql-engine*.jar' should be located in $HIVE_ENGINE_HOME/jars.")
  exit 1
fi
|
||||
@ -648,6 +648,14 @@ object KyuubiConf {
|
||||
.stringConf
|
||||
.createOptional
|
||||
|
||||
// Optional string entry naming the package (jar) used to launch the Hive engine.
val ENGINE_HIVE_MAIN_RESOURCE: OptionalConfigEntry[String] =
  buildConf("session.engine.hive.main.resource")
    .doc(
      "The package used to create Hive engine remote job. " +
        "If it is undefined, Kyuubi will use the default")
    .version("1.6.0")
    .stringConf
    .createOptional
|
||||
|
||||
val ENGINE_LOGIN_TIMEOUT: ConfigEntry[Long] = buildConf("session.engine.login.timeout")
|
||||
.doc("The timeout of creating the connection to remote sql query engine")
|
||||
.version("1.0.0")
|
||||
|
||||
@ -23,5 +23,5 @@ package org.apache.kyuubi.engine
|
||||
object EngineType extends Enumeration {
|
||||
type EngineType = Value
|
||||
|
||||
val SPARK_SQL, FLINK_SQL, TRINO = Value
|
||||
val SPARK_SQL, FLINK_SQL, TRINO, HIVE_SQL = Value
|
||||
}
|
||||
|
||||
@ -33,9 +33,10 @@ import org.apache.kyuubi.{KYUUBI_VERSION, KyuubiSQLException, Logging, Utils}
|
||||
import org.apache.kyuubi.config.KyuubiConf
|
||||
import org.apache.kyuubi.config.KyuubiConf._
|
||||
import org.apache.kyuubi.config.KyuubiReservedKeys.KYUUBI_ENGINE_SUBMIT_TIME_KEY
|
||||
import org.apache.kyuubi.engine.EngineType.{EngineType, FLINK_SQL, SPARK_SQL, TRINO}
|
||||
import org.apache.kyuubi.engine.EngineType.{EngineType, FLINK_SQL, HIVE_SQL, SPARK_SQL, TRINO}
|
||||
import org.apache.kyuubi.engine.ShareLevel.{CONNECTION, GROUP, SERVER, ShareLevel}
|
||||
import org.apache.kyuubi.engine.flink.FlinkProcessBuilder
|
||||
import org.apache.kyuubi.engine.hive.HiveProcessBuilder
|
||||
import org.apache.kyuubi.engine.spark.SparkProcessBuilder
|
||||
import org.apache.kyuubi.engine.trino.TrinoProcessBuilder
|
||||
import org.apache.kyuubi.ha.HighAvailabilityConf.HA_ZK_ENGINE_REF_ID
|
||||
@ -198,6 +199,8 @@ private[kyuubi] class EngineRef(
|
||||
new FlinkProcessBuilder(appUser, conf, extraEngineLog)
|
||||
case TRINO =>
|
||||
new TrinoProcessBuilder(appUser, conf, extraEngineLog)
|
||||
case HIVE_SQL =>
|
||||
new HiveProcessBuilder(appUser, conf, extraEngineLog)
|
||||
}
|
||||
|
||||
MetricsSystem.tracing(_.incCount(ENGINE_TOTAL))
|
||||
|
||||
@ -0,0 +1,100 @@
|
||||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
* contributor license agreements. See the NOTICE file distributed with
|
||||
* this work for additional information regarding copyright ownership.
|
||||
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||
* (the "License"); you may not use this file except in compliance with
|
||||
* the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
package org.apache.kyuubi.engine.hive
|
||||
|
||||
import java.net.URI
|
||||
import java.nio.file.{Files, Paths}
|
||||
|
||||
import org.apache.kyuubi.{KYUUBI_VERSION, KyuubiSQLException, Logging, SCALA_COMPILE_VERSION}
|
||||
import org.apache.kyuubi.config.KyuubiConf
|
||||
import org.apache.kyuubi.config.KyuubiConf.ENGINE_HIVE_MAIN_RESOURCE
|
||||
import org.apache.kyuubi.engine.ProcBuilder
|
||||
import org.apache.kyuubi.engine.hive.HiveProcessBuilder.HIVE_ENGINE_BINARY_FILE
|
||||
import org.apache.kyuubi.operation.log.OperationLog
|
||||
|
||||
/**
 * A [[ProcBuilder]] whose command line is the `hive-sql-engine.sh` launcher script.
 *
 * The engine jar and the Kyuubi configuration are not passed as command-line arguments;
 * they are handed to the script through the child process environment
 * (`HIVE_ENGINE_JAR` and `HIVE_ENGINE_DYNAMIC_ARGS`).
 *
 * @param proxyUser the user passed to the underlying [[ProcBuilder]]
 * @param conf the Kyuubi configuration used to resolve the main resource and the envs
 * @param extraEngineLog optional operation log, `None` by default
 */
class HiveProcessBuilder(
    override val proxyUser: String,
    override val conf: KyuubiConf,
    val extraEngineLog: Option[OperationLog] = None)
  extends ProcBuilder with Logging {

  /**
   * Canonical path of the launcher script `<engine home>/bin/hive-sql-engine.sh`.
   *
   * The engine home is `HIVE_ENGINE_HOME` from `env` when present; otherwise it is derived
   * from the location this class was loaded from, as `<prefix>/externals/<module>`, where
   * `<prefix>` is the part of that location preceding "kyuubi-server".
   */
  override protected def executable: String = {
    val engineHome: Option[String] = env.get("HIVE_ENGINE_HOME") match {
      case configured @ Some(_) => configured
      case None =>
        val segments = getClass.getProtectionDomain.getCodeSource.getLocation.getPath
          .split("kyuubi-server")
        assert(segments.length > 1)
        val moduleDir = Paths.get(segments.head).resolve("externals").resolve(module).toFile
        Option(moduleDir).map(_.getAbsolutePath)
    }

    engineHome match {
      case Some(dir) =>
        Paths.get(dir, "bin", HIVE_ENGINE_BINARY_FILE).toAbsolutePath.toFile.getCanonicalPath
      case None =>
        throw KyuubiSQLException("HIVE_ENGINE_HOME is not set! " +
          "For more detail information on installing and configuring Hive, please visit " +
          "https://kyuubi.apache.org/docs/stable/deployment/settings.html#environments")
    }
  }

  /**
   * Resolves the engine jar, trying in order:
   *  1. the user-specified `ENGINE_HIVE_MAIN_RESOURCE` (existence is only checked when the
   *     value has no scheme or the `file` scheme);
   *  1. the jar under `KYUUBI_HOME/externals/engines/hive/jars`, if it exists;
   *  1. the jar under the module's `target` directory, relative to the working directory
   *     or, failing that, to its parent (this last candidate is not checked for existence).
   */
  override protected def mainResource: Option[String] = {
    val jarName = s"${module}_$SCALA_COMPILE_VERSION-$KYUUBI_VERSION.jar"

    // 1. the main resource jar explicitly configured by the user
    def userSpecifiedJar: Option[String] =
      conf.get(ENGINE_HIVE_MAIN_RESOURCE).filter { resource =>
        // only local files are checked for existence
        Option(new URI(resource).getScheme).getOrElse("file") match {
          case "file" => Files.exists(Paths.get(resource))
          case _ => true
        }
      }

    // 2. the main resource jar shipped with the binary distribution
    def bundledJar: Option[String] =
      env.get(KyuubiConf.KYUUBI_HOME)
        .map(home => Paths.get(home, "externals", "engines", "hive", "jars", jarName))
        .filter(Files.exists(_))
        .map(_.toAbsolutePath.toFile.getCanonicalPath)

    // 3. the main resource jar built in a development checkout
    def devJar: Option[String] = {
      val inWorkingDir = Paths.get("externals", module, "target", jarName)
      val chosen =
        if (Files.exists(inWorkingDir)) inWorkingDir
        else Paths.get("..", "externals", module, "target", jarName)
      Some(chosen.toAbsolutePath.toFile.getCanonicalPath)
    }

    userSpecifiedJar.orElse(bundledJar).orElse(devJar)
  }

  /**
   * Environment of the child process: the envs from `conf`, plus the resolved engine jar
   * and every configuration entry rendered as a space-separated list of `-Dkey=value`.
   */
  override protected def childProcEnv: Map[String, String] = {
    val baseEnv = conf.getEnvs
    val engineJar = mainResource.get
    val dynamicArgs = conf.getAll.map { case (key, value) => s"-D$key=$value" }.mkString(" ")
    baseEnv + ("HIVE_ENGINE_JAR" -> engineJar) + ("HIVE_ENGINE_DYNAMIC_ARGS" -> dynamicArgs)
  }

  override protected def module: String = "kyuubi-hive-sql-engine"

  override protected def mainClass: String = "org.apache.kyuubi.engine.hive.HiveSQLEngine"

  /** The whole command line is just the launcher script. */
  override protected def commands: Array[String] = Array(executable)

}
|
||||
|
||||
/** Constants shared with [[HiveProcessBuilder]]. */
object HiveProcessBuilder {

  /** File name of the launcher script, looked up under the engine home's `bin` directory. */
  val HIVE_ENGINE_BINARY_FILE: String = "hive-sql-engine.sh"

}
|
||||
@ -0,0 +1,32 @@
|
||||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
* contributor license agreements. See the NOTICE file distributed with
|
||||
* this work for additional information regarding copyright ownership.
|
||||
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||
* (the "License"); you may not use this file except in compliance with
|
||||
* the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
package org.apache.kyuubi.engine.hive
|
||||
|
||||
import org.apache.kyuubi.KyuubiFunSuite
|
||||
import org.apache.kyuubi.config.KyuubiConf
|
||||
|
||||
/** Checks that [[HiveProcessBuilder]] renders a command line based on the launcher script. */
class HiveProcessBuilderSuite extends KyuubiFunSuite {

  // A fresh configuration per call, carrying one arbitrary entry.
  private def conf = KyuubiConf().set("kyuubi.on", "off")

  test("hive process builder") {
    val processBuilder = new HiveProcessBuilder("kyuubi", conf)
    // The string form of the builder is split on spaces into individual tokens.
    val tokens = processBuilder.toString.split(' ')
    assert(tokens.exists(token => token.endsWith("hive-sql-engine.sh")))
  }
}
|
||||
Loading…
Reference in New Issue
Block a user