capacity-scheduler.xml.template 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156
  1. <?xml version="1.0"?>
  2. <!-- This is the configuration file for the resource manager in Hadoop. -->
  3. <!-- You can configure various scheduling parameters related to queues. -->
  4. <!-- The properties for a queue follow a naming convention, such as -->
  5. <!-- mapred.capacity-scheduler.queue.<queue-name>.property-name. -->
  6. <configuration>
  7. <property>
  8. <name>mapred.capacity-scheduler.queue.default.guaranteed-capacity</name>
  9. <value>100</value>
  10. <description>Percentage of the number of slots in the cluster that are
  11. guaranteed to be available for jobs in this queue.
  12. </description>
  13. </property>
  14. <property>
  15. <name>mapred.capacity-scheduler.queue.default.reclaim-time-limit</name>
  16. <value>300</value>
  17. <description>The amount of time, in seconds, before which
  18. resources distributed to other queues will be reclaimed.
  19. </description>
  20. </property>
  21. <property>
  22. <name>mapred.capacity-scheduler.queue.default.supports-priority</name>
  23. <value>false</value>
  24. <description>If true, priorities of jobs will be taken into
  25. account in scheduling decisions.
  26. </description>
  27. </property>
  28. <property>
  29. <name>mapred.capacity-scheduler.queue.default.minimum-user-limit-percent</name>
  30. <value>100</value>
  31. <description> Each queue enforces a limit on the percentage of resources
  32. allocated to a user at any given time, if there is competition for them.
  33. This user limit can vary between a minimum and maximum value. The latter
  34. depends on the number of users who have submitted jobs, and the former is
  35. set to this property value. For example, suppose the value of this
  36. property is 25. If two users have submitted jobs to a queue, no single
  37. user can use more than 50% of the queue resources. If a third user submits
  38. a job, no single user can use more than 33% of the queue resources. With 4
  39. or more users, no user can use more than 25% of the queue's resources. A
  40. value of 100 implies no user limits are imposed.
  41. </description>
  42. </property>
  43. <property>
  44. <name>mapred.capacity-scheduler.queue.default.maximum-initialized-jobs-per-user</name>
  45. <value>2</value>
  46. <description>The maximum number of jobs to be pre-initialized for a user
  47. of the job queue.
  48. </description>
  49. </property>
  50. <property>
  51. <name>mapred.capacity-scheduler.reclaimCapacity.interval</name>
  52. <value>5</value>
  53. <description>The time interval, in seconds, at which the scheduler
  54. periodically determines whether capacity needs to be reclaimed for
  55. any queue.
  56. </description>
  57. </property>
  58. <!-- The default configuration settings for the capacity task scheduler -->
  59. <!-- These default values are applied to every queue that does not set -->
  60. <!-- the corresponding queue-specific property -->
  61. <property>
  62. <name>mapred.capacity-scheduler.default-reclaim-time-limit</name>
  63. <value>300</value>
  64. <description>The amount of time, in seconds, before which
  65. resources distributed to other queues will be reclaimed by default
  66. in a job queue.
  67. </description>
  68. </property>
  69. <property>
  70. <name>mapred.capacity-scheduler.default-supports-priority</name>
  71. <value>false</value>
  72. <description>If true, priorities of jobs will be taken into
  73. account in scheduling decisions by default in a job queue.
  74. </description>
  75. </property>
  76. <property>
  77. <name>mapred.capacity-scheduler.task.default-pmem-percentage-in-vmem</name>
  78. <value>-1</value>
  79. <description>If mapred.task.maxpmem is set to -1, this configuration will
  80. be used to calculate job's physical memory requirements as a percentage of
  81. the job's virtual memory requirements set via mapred.task.maxvmem. This
  82. property thus provides default value of physical memory for jobs that
  83. don't explicitly specify physical memory requirements.
  84. If not explicitly set to a valid value, scheduler will not consider
  85. physical memory for scheduling even if virtual memory based scheduling is
  86. enabled (by setting valid values for both mapred.task.default.maxvmem and
  87. mapred.task.limit.maxvmem).
  88. </description>
  89. </property>
  90. <property>
  91. <name>mapred.capacity-scheduler.task.limit.maxpmem</name>
  92. <value>-1</value>
  93. <description>Configuration that provides an upper limit on the maximum
  94. physical memory that can be specified by a job. The job configuration
  95. mapred.task.maxpmem should be less than this value. If not, the job will
  96. be rejected by the scheduler.
  97. If it is set to -1, scheduler will not consider physical memory for
  98. scheduling even if virtual memory based scheduling is enabled (by setting
  99. valid values for both mapred.task.default.maxvmem and
  100. mapred.task.limit.maxvmem).
  101. </description>
  102. </property>
  103. <property>
  104. <name>mapred.capacity-scheduler.default-minimum-user-limit-percent</name>
  105. <value>100</value>
  106. <description>The percentage of the resources limited to a particular user
  107. for the job queue at any given point of time by default.
  108. </description>
  109. </property>
  110. <property>
  111. <name>mapred.capacity-scheduler.default-maximum-initialized-jobs-per-user</name>
  112. <value>2</value>
  113. <description>The maximum number of jobs to be pre-initialized for a user
  114. of the job queue.
  115. </description>
  116. </property>
  117. <!-- Capacity scheduler Job Initialization configuration parameters -->
  118. <property>
  119. <name>mapred.capacity-scheduler.init-poll-interval</name>
  120. <value>5000</value>
  121. <description>The interval, in milliseconds, at which the job queues
  122. are polled for jobs to initialize.
  123. </description>
  124. </property>
  125. <property>
  126. <name>mapred.capacity-scheduler.init-worker-threads</name>
  127. <value>5</value>
  128. <description>Number of worker threads used by the initialization
  129. poller to initialize jobs in a set of queues.
  130. If this number is equal to the number of job queues, then the jobs
  131. in each queue are initialized by a single thread. If it is smaller,
  132. then each thread is assigned a set of queues. If it is greater,
  133. then the number of threads is limited to the number of
  134. job queues.
  135. </description>
  136. </property>
  137. </configuration>