|
@@ -0,0 +1,164 @@
|
|
|
+<?xml version="1.0" encoding="UTF-8"?>
|
|
|
+<!--
|
|
|
+/**
|
|
|
+ * Licensed to the Apache Software Foundation (ASF) under one
|
|
|
+ * or more contributor license agreements. See the NOTICE file
|
|
|
+ * distributed with this work for additional information
|
|
|
+ * regarding copyright ownership. The ASF licenses this file
|
|
|
+ * to you under the Apache License, Version 2.0 (the
|
|
|
+ * "License"); you may not use this file except in compliance
|
|
|
+ * with the License. You may obtain a copy of the License at
|
|
|
+ *
|
|
|
+ * http://www.apache.org/licenses/LICENSE-2.0
|
|
|
+ *
|
|
|
+ * Unless required by applicable law or agreed to in writing, software
|
|
|
+ * distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
+ * See the License for the specific language governing permissions and
|
|
|
+ * limitations under the License.
|
|
|
+ */
|
|
|
+-->
|
|
|
+
|
|
|
+<configuration supports_final="true">
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.executor.memoryOverhead</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.driver.memoryOverhead</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.scheduler.heartbeat.interval-ms</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.max.executor.failures</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.containerLauncherMaxThreads</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.submit.file.replication</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.preserve.staging.files</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <!-- spark.yarn.max.executor.failures is already marked as deleted earlier in this file; the duplicate entry was dropped. -->
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.services</name>
|
|
|
+ <deleted>true</deleted>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.history.provider</name>
|
|
|
+ <value>org.apache.spark.deploy.history.FsHistoryProvider</value>
|
|
|
+ <description>Name of history provider class</description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.history.fs.logDirectory</name>
|
|
|
+ <value>{{spark_history_dir}}</value>
|
|
|
+ <description>
|
|
|
+ Base directory for Spark application history logs.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.eventLog.enabled</name>
|
|
|
+ <value>true</value>
|
|
|
+ <description>
|
|
|
+ Whether to log Spark events, useful for reconstructing the Web UI after the application has finished.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.eventLog.dir</name>
|
|
|
+ <value>{{spark_history_dir}}</value>
|
|
|
+ <description>
|
|
|
+ Base directory in which Spark events are logged, if spark.eventLog.enabled is true.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.master</name>
|
|
|
+ <value>{{spark_thrift_master}}</value>
|
|
|
+ <description>
|
|
|
+ The deploy mode of the Spark application. By default it is yarn-client for the Thrift server, but local mode is used
|
|
|
+ when there is only one NodeManager.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.scheduler.allocation.file</name>
|
|
|
+ <value>{{spark_conf}}/spark-thrift-fairscheduler.xml</value>
|
|
|
+ <description>
|
|
|
+ Scheduler configuration file for thriftserver.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.scheduler.mode</name>
|
|
|
+ <value>FAIR</value>
|
|
|
+ <description>
|
|
|
+ The scheduling mode between jobs submitted to the same SparkContext.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.shuffle.service.enabled</name>
|
|
|
+ <value>true</value>
|
|
|
+ <description>
|
|
|
+ Enables the external shuffle service.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.dynamicAllocation.enabled</name>
|
|
|
+ <value>true</value>
|
|
|
+ <description>
|
|
|
+ Whether to use dynamic resource allocation, which scales the number of executors registered with this application up and down based on the workload.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.executor.instances</name>
|
|
|
+ <value>2</value>
|
|
|
+ <description>
|
|
|
+ The number of executors.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.yarn.am.memory</name>
|
|
|
+ <value>512m</value>
|
|
|
+ <description>
|
|
|
+ Amount of memory to use for the YARN Application Master in client mode.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+ <property>
|
|
|
+ <name>spark.executor.memory</name>
|
|
|
+ <value>1g</value>
|
|
|
+ <description>
|
|
|
+ Amount of memory to use per executor process.
|
|
|
+ </description>
|
|
|
+ </property>
|
|
|
+
|
|
|
+</configuration>
|