capacity-scheduler.xml.template 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126
  1. <?xml version="1.0"?>
  2. <!-- This is the configuration file for the resource manager in Hadoop. -->
  3. <!-- You can configure various scheduling parameters related to queues. -->
  4. <!-- The properties for a queue follow a naming convention, such as -->
  5. <!-- mapred.capacity-scheduler.queue.<queue-name>.property-name. -->
  6. <configuration>
  7. <property>
  8. <name>mapred.capacity-scheduler.queue.default.capacity</name>
  9. <value>100</value>
  10. <description>Percentage of the number of slots in the cluster that are
  11. to be available for jobs in this queue.
  12. </description>
  13. </property>
  14. <property>
  15. <name>mapred.capacity-scheduler.queue.default.supports-priority</name>
  16. <value>false</value>
  17. <description>If true, priorities of jobs will be taken into
  18. account in scheduling decisions.
  19. </description>
  20. </property>
  21. <property>
  22. <name>mapred.capacity-scheduler.queue.default.minimum-user-limit-percent</name>
  23. <value>100</value>
  24. <description> Each queue enforces a limit on the percentage of resources
  25. allocated to a user at any given time, if there is competition for them.
  26. This user limit can vary between a minimum and maximum value. The former
  27. is set to this property value, and the latter depends on the number of
  28. users who have submitted jobs. For example, suppose the value of this
  29. property is 25. If two users have submitted jobs to a queue, no single
  30. user can use more than 50% of the queue resources. If a third user submits
  31. a job, no single user can use more than 33% of the queue resources. With 4
  32. or more users, no user can use more than 25% of the queue's resources. A
  33. value of 100 implies no user limits are imposed.
  34. </description>
  35. </property>
  36. <property>
  37. <name>mapred.capacity-scheduler.queue.default.maximum-initialized-jobs-per-user</name>
  38. <value>2</value>
  39. <description>The maximum number of jobs to be pre-initialized for a user
  40. of the job queue.
  41. </description>
  42. </property>
  43. <!-- The default configuration settings for the capacity task scheduler -->
  44. <!-- The default values would be applied to all the queues which don't have -->
  45. <!-- the appropriate property for the particular queue -->
  46. <property>
  47. <name>mapred.capacity-scheduler.default-supports-priority</name>
  48. <value>false</value>
  49. <description>If true, priorities of jobs will be taken into
  50. account in scheduling decisions by default in a job queue.
  51. </description>
  52. </property>
  53. <property>
  54. <name>mapred.capacity-scheduler.task.default-pmem-percentage-in-vmem</name>
  55. <value>-1</value>
  56. <description>A percentage (float) of the default VM limit for jobs
  57. (mapred.task.default.maxvmem). This is the default RAM task-limit
  58. associated with a task. Unless overridden by a job's setting, this
  59. number defines the RAM task-limit.
  60. If this property is missing, or set to an invalid value, scheduling
  61. based on physical memory, RAM, is disabled.
  62. </description>
  63. </property>
  64. <property>
  65. <name>mapred.capacity-scheduler.task.limit.maxpmem</name>
  66. <value>-1</value>
  67. <description>Configuration that provides an upper limit on the maximum
  68. physical memory that can be specified by a job. The job configuration
  69. mapred.task.maxpmem should be less than this value. If not, the job will
  70. be rejected by the scheduler.
  71. If it is set to -1, the scheduler will not consider physical memory for
  72. scheduling even if virtual memory based scheduling is enabled (by setting
  73. valid values for both mapred.task.default.maxvmem and
  74. mapred.task.limit.maxvmem).
  75. </description>
  76. </property>
  77. <property>
  78. <name>mapred.capacity-scheduler.default-minimum-user-limit-percent</name>
  79. <value>100</value>
  80. <description>The default percentage of a job queue's resources to which
  81. a single user is limited at any given point of time.
  82. </description>
  83. </property>
  84. <property>
  85. <name>mapred.capacity-scheduler.default-maximum-initialized-jobs-per-user</name>
  86. <value>2</value>
  87. <description>The maximum number of jobs to be pre-initialized for a user
  88. of the job queue.
  89. </description>
  90. </property>
  91. <!-- Capacity scheduler Job Initialization configuration parameters -->
  92. <property>
  93. <name>mapred.capacity-scheduler.init-poll-interval</name>
  94. <value>5000</value>
  95. <description>The amount of time in milliseconds which is used to poll
  96. the job queues for jobs to initialize.
  97. </description>
  98. </property>
  99. <property>
  100. <name>mapred.capacity-scheduler.init-worker-threads</name>
  101. <value>5</value>
  102. <description>Number of worker threads which would be used by the
  103. initialization poller to initialize jobs in a set of queues.
  104. If the number given in this property is equal to the number of job queues,
  105. then a single thread would initialize the jobs in each queue. If it is
  106. less, then each thread would get a set of queues assigned. If the number
  107. is greater, then the number of threads would be equal to the number of
  108. job queues.
  109. </description>
  110. </property>
  111. </configuration>