@@ -1,200 +0,0 @@
-#!/usr/bin/python
-"""
-Licensed to the Apache Software Foundation (ASF) under one
-or more contributor license agreements. See the NOTICE file
-distributed with this work for additional information
-regarding copyright ownership. The ASF licenses this file
-to you under the Apache License, Version 2.0 (the
-"License"); you may not use this file except in compliance
-with the License. You may obtain a copy of the License at
-
-    http://www.apache.org/licenses/LICENSE-2.0
-
-Unless required by applicable law or agreed to in writing, software
-distributed under the License is distributed on an "AS IS" BASIS,
-WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-See the License for the specific language governing permissions and
-limitations under the License.
-
-"""
-
-
-import status_params
-from resource_management.libraries.functions.stack_features import check_stack_feature
-from resource_management.libraries.functions import StackFeature
-from setup_spark import *
-
-import resource_management.libraries.functions
-from resource_management.libraries.functions import conf_select
-from resource_management.libraries.functions import stack_select
-from resource_management.libraries.functions import format
-from resource_management.libraries.functions.get_stack_version import get_stack_version
-from resource_management.libraries.functions.version import format_stack_version
-from resource_management.libraries.functions.default import default
-from resource_management.libraries.functions import get_kinit_path
-from resource_management.libraries.functions.get_not_managed_resources import get_not_managed_resources
-
-from resource_management.libraries.script.script import Script
-
-# a map of the Ambari role to the component name
-# for use with <stack-root>/current/<component>
-SERVER_ROLE_DIRECTORY_MAP = {
-  'SPARK_JOBHISTORYSERVER' : 'spark-historyserver',
-  'SPARK_CLIENT' : 'spark-client',
-  'SPARK_THRIFTSERVER' : 'spark-thriftserver'
-}
-
-component_directory = Script.get_component_from_role(SERVER_ROLE_DIRECTORY_MAP, "SPARK_CLIENT")
-
-config = Script.get_config()
-tmp_dir = Script.get_tmp_dir()
-
-stack_name = status_params.stack_name
-stack_root = Script.get_stack_root()
-stack_version_unformatted = config['hostLevelParams']['stack_version']
-stack_version_formatted = format_stack_version(stack_version_unformatted)
-host_sys_prepped = default("/hostLevelParams/host_sys_prepped", False)
-
-# New Cluster Stack Version that is defined during the RESTART of a Stack Upgrade
-version = default("/commandParams/version", None)
-
-spark_conf = '/etc/spark/conf'
-hadoop_conf_dir = conf_select.get_hadoop_conf_dir()
-hadoop_bin_dir = stack_select.get_hadoop_dir("bin")
-
-if stack_version_formatted and check_stack_feature(StackFeature.ROLLING_UPGRADE, stack_version_formatted):
-  hadoop_home = stack_select.get_hadoop_dir("home")
-  spark_conf = format("{stack_root}/current/{component_directory}/conf")
-  spark_log_dir = config['configurations']['spark-env']['spark_log_dir']
-  spark_daemon_memory = config['configurations']['spark-env']['spark_daemon_memory']
-  spark_pid_dir = status_params.spark_pid_dir
-  spark_home = format("{stack_root}/current/{component_directory}")
-
-spark_thrift_server_conf_file = spark_conf + "/spark-thrift-sparkconf.conf"
-java_home = config['hostLevelParams']['java_home']
-
-hdfs_user = config['configurations']['hadoop-env']['hdfs_user']
-hdfs_principal_name = config['configurations']['hadoop-env']['hdfs_principal_name']
-hdfs_user_keytab = config['configurations']['hadoop-env']['hdfs_user_keytab']
-user_group = config['configurations']['cluster-env']['user_group']
-
-spark_user = status_params.spark_user
-hive_user = status_params.hive_user
-spark_group = status_params.spark_group
-user_group = status_params.user_group
-spark_hdfs_user_dir = format("/user/{spark_user}")
-spark_history_dir = default('/configurations/spark-defaults/spark.history.fs.logDirectory', "hdfs:///spark-history")
-
-spark_history_server_pid_file = status_params.spark_history_server_pid_file
-spark_thrift_server_pid_file = status_params.spark_thrift_server_pid_file
-
-spark_history_server_start = format("{spark_home}/sbin/start-history-server.sh")
-spark_history_server_stop = format("{spark_home}/sbin/stop-history-server.sh")
-
-spark_thrift_server_start = format("{spark_home}/sbin/start-thriftserver.sh")
-spark_thrift_server_stop = format("{spark_home}/sbin/stop-thriftserver.sh")
-spark_logs_dir = format("{spark_home}/logs")
-spark_hadoop_lib_native = format("{stack_root}/current/hadoop-client/lib/native")
-
-spark_submit_cmd = format("{spark_home}/bin/spark-submit")
-spark_smoke_example = "org.apache.spark.examples.SparkPi"
-spark_service_check_cmd = format(
-  "{spark_submit_cmd} --class {spark_smoke_example} --master yarn-cluster --num-executors 1 --driver-memory 256m --executor-memory 256m --executor-cores 1 {spark_home}/lib/spark-examples*.jar 1")
-
-spark_jobhistoryserver_hosts = default("/clusterHostInfo/spark_jobhistoryserver_hosts", [])
-
-if len(spark_jobhistoryserver_hosts) > 0:
-  spark_history_server_host = spark_jobhistoryserver_hosts[0]
-else:
-  spark_history_server_host = "localhost"
-
-# spark-defaults params
-spark_yarn_historyServer_address = default(spark_history_server_host, "localhost")
-
-spark_history_ui_port = config['configurations']['spark-defaults']['spark.history.ui.port']
-
-spark_env_sh = config['configurations']['spark-env']['content']
-spark_log4j_properties = config['configurations']['spark-log4j-properties']['content']
-spark_metrics_properties = config['configurations']['spark-metrics-properties']['content']
-
-hive_server_host = default("/clusterHostInfo/hive_server_host", [])
-is_hive_installed = not len(hive_server_host) == 0
-
-security_enabled = config['configurations']['cluster-env']['security_enabled']
-kinit_path_local = get_kinit_path(default('/configurations/kerberos-env/executable_search_paths', None))
-spark_kerberos_keytab = config['configurations']['spark-defaults']['spark.history.kerberos.keytab']
-spark_kerberos_principal = config['configurations']['spark-defaults']['spark.history.kerberos.principal']
-
-spark_thriftserver_hosts = default("/clusterHostInfo/spark_thriftserver_hosts", [])
-has_spark_thriftserver = not len(spark_thriftserver_hosts) == 0
-
-# hive-site params
-spark_hive_properties = {
-  'hive.metastore.uris': config['configurations']['hive-site']['hive.metastore.uris']
-}
-
-# security settings
-if security_enabled:
-  spark_principal = spark_kerberos_principal.replace('_HOST',spark_history_server_host.lower())
-
-  if is_hive_installed:
-    spark_hive_properties.update({
-      'hive.metastore.sasl.enabled': str(config['configurations']['hive-site']['hive.metastore.sasl.enabled']).lower(),
-      'hive.metastore.kerberos.keytab.file': config['configurations']['hive-site']['hive.metastore.kerberos.keytab.file'],
-      'hive.server2.authentication.spnego.principal': config['configurations']['hive-site']['hive.server2.authentication.spnego.principal'],
-      'hive.server2.authentication.spnego.keytab': config['configurations']['hive-site']['hive.server2.authentication.spnego.keytab'],
-      'hive.metastore.kerberos.principal': config['configurations']['hive-site']['hive.metastore.kerberos.principal'],
-      'hive.server2.authentication.kerberos.principal': config['configurations']['hive-site']['hive.server2.authentication.kerberos.principal'],
-      'hive.server2.authentication.kerberos.keytab': config['configurations']['hive-site']['hive.server2.authentication.kerberos.keytab'],
-      'hive.server2.authentication': config['configurations']['hive-site']['hive.server2.authentication'],
-    })
-
-    hive_kerberos_keytab = config['configurations']['hive-site']['hive.server2.authentication.kerberos.keytab']
-    hive_kerberos_principal = config['configurations']['hive-site']['hive.server2.authentication.kerberos.principal']
-
-# thrift server support - available on HDP 2.3 or higher
-spark_thrift_sparkconf = None
-spark_thrift_cmd_opts_properties = ''
-spark_thrift_fairscheduler_content = None
-spark_thrift_master = "yarn-client"
-if 'nm_hosts' in config['clusterHostInfo'] and len(config['clusterHostInfo']['nm_hosts']) == 1:
-  # use local mode when there's only one nodemanager
-  spark_thrift_master = "local[4]"
-
-if has_spark_thriftserver and 'spark-thrift-sparkconf' in config['configurations']:
-  spark_thrift_sparkconf = config['configurations']['spark-thrift-sparkconf']
-  spark_thrift_cmd_opts_properties = config['configurations']['spark-env']['spark_thrift_cmd_opts']
-  if is_hive_installed:
-    # update default metastore client properties (async wait for metastore component) it is useful in case of
-    # blueprint provisioning when hive-metastore and spark-thriftserver is not on the same host.
-    spark_hive_properties.update({
-      'hive.metastore.client.socket.timeout' : config['configurations']['hive-site']['hive.metastore.client.socket.timeout']
-    })
-    spark_hive_properties.update(config['configurations']['spark-hive-site-override'])
-
-  if 'spark-thrift-fairscheduler' in config['configurations'] and 'fairscheduler_content' in config['configurations']['spark-thrift-fairscheduler']:
-    spark_thrift_fairscheduler_content = config['configurations']['spark-thrift-fairscheduler']['fairscheduler_content']
-
-default_fs = config['configurations']['core-site']['fs.defaultFS']
-hdfs_site = config['configurations']['hdfs-site']
-
-dfs_type = default("/commandParams/dfs_type", "")
-
-import functools
-#create partial functions with common arguments for every HdfsResource call
-#to create/delete hdfs directory/file/copyfromlocal we need to call params.HdfsResource in code
-HdfsResource = functools.partial(
-  HdfsResource,
-  user=hdfs_user,
-  hdfs_resource_ignore_file = "/var/lib/ambari-agent/data/.hdfs_resource_ignore",
-  security_enabled = security_enabled,
-  keytab = hdfs_user_keytab,
-  kinit_path_local = kinit_path_local,
-  hadoop_bin_dir = hadoop_bin_dir,
-  hadoop_conf_dir = hadoop_conf_dir,
-  principal_name = hdfs_principal_name,
-  hdfs_site = hdfs_site,
-  default_fs = default_fs,
-  immutable_paths = get_not_managed_resources(),
-  dfs_type = dfs_type
- )
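
The deleted params.py ends by pre-binding the arguments shared by every `HdfsResource` call with `functools.partial`, so call sites only supply the per-call values. A minimal, self-contained sketch of that standard-library pattern follows; the `hdfs_resource` stub and its parameter names below are illustrative stand-ins, not the real `resource_management` API.

```python
import functools

def hdfs_resource(path, user=None, security_enabled=False, keytab=None, action=None):
    # Illustrative stand-in for the real HdfsResource; it just echoes its arguments.
    print(path, user, security_enabled, keytab, action)

# Bind the arguments that are identical for every call once, as params.py does.
HdfsResource = functools.partial(
    hdfs_resource,
    user="hdfs",
    security_enabled=False,
    keytab=None,
)

# Callers now pass only the per-call arguments.
HdfsResource("/user/spark", action="create_on_execute")
```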