hadoop-mapred_0.22.0.xml 1.3 MB


  1. <?xml version="1.0" encoding="iso-8859-1" standalone="no"?>
  2. <!-- Generated by the JDiff Javadoc doclet -->
  3. <!-- (http://www.jdiff.org) -->
  4. <!-- on Sun Dec 04 01:04:32 UTC 2011 -->
  5. <api
  6. xmlns:xsi='http://www.w3.org/2001/XMLSchema-instance'
  7. xsi:noNamespaceSchemaLocation='api.xsd'
  8. name="hadoop-mapred 0.22.0"
  9. jdversion="1.0.9">
  10. <!-- Command line arguments = -doclet org.apache.hadoop.classification.tools.ExcludePrivateAnnotationsJDiffDoclet -docletpath /x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/build/ivy/lib/Hadoop/common/hadoop-common-0.22.0-SNAPSHOT.jar:/x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/build/ivy/lib/Hadoop/jdiff/jdiff-1.0.9.jar:/x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/build/ivy/lib/Hadoop/jdiff/xerces-1.4.4.jar -classpath /x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/build/classes:/x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/conf:/home/jenkins/.ivy2/cache/org.apache.hadoop/hadoop-common/jars/hadoop-common-0.22.0-SNAPSHOT.jar:/home/jenkins/.ivy2/cache/commons-cli/commons-cli/jars/commons-cli-1.2.jar:/home/jenkins/.ivy2/cache/xmlenc/xmlenc/jars/xmlenc-0.52.jar:/home/jenkins/.ivy2/cache/commons-codec/commons-codec/jars/commons-codec-1.4.jar:/home/jenkins/.ivy2/cache/commons-logging/commons-logging/jars/commons-logging-1.1.1.jar:/home/jenkins/.ivy2/cache/org.slf4j/slf4j-api/jars/slf4j-api-1.6.1.jar:/home/jenkins/.ivy2/cache/org.slf4j/slf4j-log4j12/jars/slf4j-log4j12-1.6.1.jar:/home/jenkins/.ivy2/cache/log4j/log4j/bundles/log4j-1.2.16.jar:/home/jenkins/.ivy2/cache/org.mortbay.jetty/jetty/jars/jetty-6.1.26.jar:/home/jenkins/.ivy2/cache/org.mortbay.jetty/jetty-util/jars/jetty-util-6.1.26.jar:/home/jenkins/.ivy2/cache/org.mortbay.jetty/servlet-api/jars/servlet-api-2.5-20081211.jar:/home/jenkins/.ivy2/cache/tomcat/jasper-runtime/jars/jasper-runtime-5.5.12.jar:/home/jenkins/.ivy2/cache/tomcat/jasper-compiler/jars/jasper-compiler-5.5.12.jar:/home/jenkins/.ivy2/cache/org.mortbay.jetty/jsp-2.1-jetty/jars/jsp-2.1-jetty-6.1.26.jar:/home/jenkins/.ivy2/cache/org.eclipse.jdt/core/jars/core-3.1.1.jar:/home/jenkins/.ivy2/cache/org.mortbay.jetty/jsp-api-2.1-glassfish/jars/jsp-api-2.1-glassfish-2.1.v20091210.jar:/home/jenkins/.ivy2/cache/org.mortbay.jetty/jsp-2.1-glassf
ish/jars/jsp-2.1-glassfish-2.1.v20091210.jar:/home/jenkins/.ivy2/cache/org.eclipse.jdt.core.compiler/ecj/jars/ecj-3.5.1.jar:/home/jenkins/.ivy2/cache/commons-el/commons-el/jars/commons-el-1.0.jar:/home/jenkins/.ivy2/cache/net.java.dev.jets3t/jets3t/jars/jets3t-0.7.1.jar:/home/jenkins/.ivy2/cache/commons-httpclient/commons-httpclient/jars/commons-httpclient-3.1.jar:/home/jenkins/.ivy2/cache/commons-net/commons-net/jars/commons-net-1.4.1.jar:/home/jenkins/.ivy2/cache/oro/oro/jars/oro-2.0.8.jar:/home/jenkins/.ivy2/cache/net.sf.kosmosfs/kfs/jars/kfs-0.3.jar:/home/jenkins/.ivy2/cache/junit/junit/jars/junit-4.8.1.jar:/home/jenkins/.ivy2/cache/hsqldb/hsqldb/jars/hsqldb-1.8.0.10.jar:/home/jenkins/.ivy2/cache/org.apache.avro/avro/jars/avro-1.5.3.jar:/home/jenkins/.ivy2/cache/org.codehaus.jackson/jackson-mapper-asl/jars/jackson-mapper-asl-1.7.3.jar:/home/jenkins/.ivy2/cache/org.codehaus.jackson/jackson-core-asl/jars/jackson-core-asl-1.7.3.jar:/home/jenkins/.ivy2/cache/com.thoughtworks.paranamer/paranamer/jars/paranamer-2.3.jar:/home/jenkins/.ivy2/cache/org.xerial.snappy/snappy-java/bundles/snappy-java-1.0.3.2.jar:/home/jenkins/.ivy2/cache/org.apache.avro/avro-ipc/jars/avro-ipc-1.5.3.jar:/home/jenkins/.ivy2/cache/org.apache.hadoop/hadoop-common-test/jars/hadoop-common-test-0.22.0-SNAPSHOT.jar:/home/jenkins/.ivy2/cache/org.apache.hadoop/hadoop-hdfs/jars/hadoop-hdfs-0.22.0-SNAPSHOT.jar:/home/jenkins/.ivy2/cache/com.google.guava/guava/jars/guava-r09.jar:/home/jenkins/.ivy2/cache/org.apache.avro/avro-compiler/jars/avro-compiler-1.5.3.jar:/home/jenkins/.ivy2/cache/commons-lang/commons-lang/jars/commons-lang-2.5.jar:/home/jenkins/.ivy2/cache/org.apache.velocity/velocity/jars/velocity-1.6.4.jar:/home/jenkins/.ivy2/cache/commons-collections/commons-collections/jars/commons-collections-3.2.1.jar:/home/jenkins/.ivy2/cache/org.aspectj/aspectjrt/jars/aspectjrt-1.6.5.jar:/home/jenkins/.ivy2/cache/org.aspectj/aspectjtools/jars/aspectjtools-1.6.5.jar:/home/jenkins/.ivy2/cache/jdiff/jdiff/jar
s/jdiff-1.0.9.jar:/home/jenkins/.ivy2/cache/xerces/xerces/jars/xerces-1.4.4.jar:/home/jenkins/tools/ant/latest/lib/ant-launcher.jar:/usr/share/java/xmlParserAPIs.jar:/usr/share/java/xercesImpl.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-resolver.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-bcel.jar:/home/jenkins/tools/ant/latest/lib/ant-jsch.jar:/home/jenkins/tools/ant/latest/lib/ant-jmf.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-oro.jar:/home/jenkins/tools/ant/latest/lib/ant-netrexx.jar:/home/jenkins/tools/ant/latest/lib/ant-testutil.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-xalan2.jar:/home/jenkins/tools/ant/latest/lib/ant-javamail.jar:/home/jenkins/tools/ant/latest/lib/ant.jar:/home/jenkins/tools/ant/latest/lib/ant-junit.jar:/home/jenkins/tools/ant/latest/lib/ant-swing.jar:/home/jenkins/tools/ant/latest/lib/ant-commons-net.jar:/home/jenkins/tools/ant/latest/lib/ant-jdepend.jar:/home/jenkins/tools/ant/latest/lib/ant-junit4.jar:/home/jenkins/tools/ant/latest/lib/ant-commons-logging.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-bsf.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-log4j.jar:/home/jenkins/tools/ant/latest/lib/ant-jai.jar:/home/jenkins/tools/ant/latest/lib/ant-apache-regexp.jar:/home/jenkins/tools/ant/latest/lib/ant-antlr.jar:/tmp/jdk1.6.0_29/lib/tools.jar -sourcepath /x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/src/java:/x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/src/tools -apidir /x1/jenkins/jenkins-slave/workspace/Hadoop-22-Build/common/mapreduce/lib/jdiff -apiname hadoop-mapred 0.22.0 -->
  11. <package name="org.apache.hadoop.filecache">
  12. <!-- start class org.apache.hadoop.filecache.DistributedCache -->
  13. <class name="DistributedCache" extends="org.apache.hadoop.mapreduce.filecache.DistributedCache"
  14. abstract="false"
  15. static="false" final="false" visibility="public"
  16. deprecated="Use methods on {@link Job}.">
  17. <constructor name="DistributedCache"
  18. static="false" final="false" visibility="public"
  19. deprecated="not deprecated">
  20. </constructor>
  21. <doc>
  22. <![CDATA[Distribute application-specific large, read-only files efficiently.
  23. <p><code>DistributedCache</code> is a facility provided by the Map-Reduce
  24. framework to cache files (text, archives, jars etc.) needed by applications.
  25. </p>
  26. <p>Applications specify the files, via urls (hdfs:// or http://) to be cached
  27. via the {@link org.apache.hadoop.mapred.JobConf}. The
  28. <code>DistributedCache</code> assumes that the files specified via urls are
  29. already present on the {@link FileSystem} at the path specified by the url
  30. and are accessible by every machine in the cluster.</p>
  31. <p>The framework will copy the necessary files on to the slave node before
  32. any tasks for the job are executed on that node. Its efficiency stems from
  33. the fact that the files are only copied once per job and the ability to
  34. cache archives which are un-archived on the slaves.</p>
  35. <p><code>DistributedCache</code> can be used to distribute simple, read-only
  36. data/text files and/or more complex types such as archives, jars etc.
  37. Archives (zip, tar and tgz/tar.gz files) are un-archived at the slave nodes.
  38. Jars may be optionally added to the classpath of the tasks, a rudimentary
  39. software distribution mechanism. Files have execution permissions.
  40. Optionally users can also direct it to symlink the distributed cache file(s)
  41. into the working directory of the task.</p>
  42. <p><code>DistributedCache</code> tracks modification timestamps of the cache
  43. files. Clearly the cache files should not be modified by the application
  44. or externally while the job is executing.</p>
  45. <p>Here is an illustrative example on how to use the
  46. <code>DistributedCache</code>:</p>
  47. <p><blockquote><pre>
  48. // Setting up the cache for the application
  49. 1. Copy the requisite files to the <code>FileSystem</code>:
  50. $ bin/hadoop fs -copyFromLocal lookup.dat /myapp/lookup.dat
  51. $ bin/hadoop fs -copyFromLocal map.zip /myapp/map.zip
  52. $ bin/hadoop fs -copyFromLocal mylib.jar /myapp/mylib.jar
  53. $ bin/hadoop fs -copyFromLocal mytar.tar /myapp/mytar.tar
  54. $ bin/hadoop fs -copyFromLocal mytgz.tgz /myapp/mytgz.tgz
  55. $ bin/hadoop fs -copyFromLocal mytargz.tar.gz /myapp/mytargz.tar.gz
  56. 2. Setup the application's <code>JobConf</code>:
  57. JobConf job = new JobConf();
  58. DistributedCache.addCacheFile(new URI("/myapp/lookup.dat#lookup.dat"),
  59. job);
  60. DistributedCache.addCacheArchive(new URI("/myapp/map.zip"), job);
  61. DistributedCache.addFileToClassPath(new Path("/myapp/mylib.jar"), job);
  62. DistributedCache.addCacheArchive(new URI("/myapp/mytar.tar"), job);
  63. DistributedCache.addCacheArchive(new URI("/myapp/mytgz.tgz"), job);
  64. DistributedCache.addCacheArchive(new URI("/myapp/mytargz.tar.gz"), job);
  65. 3. Use the cached files in the {@link org.apache.hadoop.mapred.Mapper}
  66. or {@link org.apache.hadoop.mapred.Reducer}:
  67. public static class MapClass extends MapReduceBase
  68. implements Mapper&lt;K, V, K, V&gt; {
  69. private Path[] localArchives;
  70. private Path[] localFiles;
  71. public void configure(JobConf job) {
  72. // Get the cached archives/files
  73. localArchives = DistributedCache.getLocalCacheArchives(job);
  74. localFiles = DistributedCache.getLocalCacheFiles(job);
  75. }
  76. public void map(K key, V value,
  77. OutputCollector&lt;K, V&gt; output, Reporter reporter)
  78. throws IOException {
  79. // Use data from the cached archives/files here
  80. // ...
  81. // ...
  82. output.collect(key, value);
  83. }
  84. }
  85. </pre></blockquote></p>
  86. It is also very common to use the DistributedCache by using
  87. {@link org.apache.hadoop.util.GenericOptionsParser}.
  88. This class includes methods that should be used by users
  89. (specifically those mentioned in the example above, as well
  90. as {@link DistributedCache#addArchiveToClassPath(Path, Configuration)}),
  91. as well as methods intended for use by the MapReduce framework
  92. (e.g., {@link org.apache.hadoop.mapred.JobClient}). For implementation
  93. details, see {@link TrackerDistributedCacheManager} and
  94. {@link TaskDistributedCacheManager}.
  95. @see org.apache.hadoop.mapred.JobConf
  96. @see org.apache.hadoop.mapred.JobClient
  97. @see org.apache.hadoop.mapreduce.Job
  98. @deprecated Use methods on {@link Job}.]]>
  99. </doc>
  100. </class>
  101. <!-- end class org.apache.hadoop.filecache.DistributedCache -->
  102. </package>
  103. <package name="org.apache.hadoop.mapred">
  104. <!-- start class org.apache.hadoop.mapred.ClusterStatus -->
  105. <class name="ClusterStatus" extends="java.lang.Object"
  106. abstract="false"
  107. static="false" final="false" visibility="public"
  108. deprecated="Use {@link ClusterMetrics} or {@link TaskTrackerInfo} instead">
  109. <implements name="org.apache.hadoop.io.Writable"/>
  110. <method name="getTaskTrackers" return="int"
  111. abstract="false" native="false" synchronized="false"
  112. static="false" final="false" visibility="public"
  113. deprecated="not deprecated">
  114. <doc>
  115. <![CDATA[Get the number of task trackers in the cluster.
  116. @return the number of task trackers in the cluster.]]>
  117. </doc>
  118. </method>
  119. <method name="getActiveTrackerNames" return="java.util.Collection"
  120. abstract="false" native="false" synchronized="false"
  121. static="false" final="false" visibility="public"
  122. deprecated="not deprecated">
  123. <doc>
  124. <![CDATA[Get the names of the active task trackers in the cluster.
  125. @return the names of the active task trackers in the cluster.]]>
  126. </doc>
  127. </method>
  128. <method name="getBlacklistedTrackerNames" return="java.util.Collection"
  129. abstract="false" native="false" synchronized="false"
  130. static="false" final="false" visibility="public"
  131. deprecated="not deprecated">
  132. <doc>
  133. <![CDATA[Get the names of the blacklisted task trackers in the cluster.
  134. @return the names of the blacklisted task trackers in the cluster.]]>
  135. </doc>
  136. </method>
  137. <method name="getBlacklistedTrackers" return="int"
  138. abstract="false" native="false" synchronized="false"
  139. static="false" final="false" visibility="public"
  140. deprecated="not deprecated">
  141. <doc>
  142. <![CDATA[Get the number of blacklisted task trackers in the cluster.
  143. @return the number of blacklisted task trackers in the cluster.]]>
  144. </doc>
  145. </method>
  146. <method name="getNumExcludedNodes" return="int"
  147. abstract="false" native="false" synchronized="false"
  148. static="false" final="false" visibility="public"
  149. deprecated="not deprecated">
  150. <doc>
  151. <![CDATA[Get the number of excluded hosts in the cluster.
  152. @return the number of excluded hosts in the cluster.]]>
  153. </doc>
  154. </method>
  155. <method name="getTTExpiryInterval" return="long"
  156. abstract="false" native="false" synchronized="false"
  157. static="false" final="false" visibility="public"
  158. deprecated="not deprecated">
  159. <doc>
  160. <![CDATA[Get the tasktracker expiry interval for the cluster.
  161. @return the expiry interval in milliseconds]]>
  162. </doc>
  163. </method>
  164. <method name="getMapTasks" return="int"
  165. abstract="false" native="false" synchronized="false"
  166. static="false" final="false" visibility="public"
  167. deprecated="not deprecated">
  168. <doc>
  169. <![CDATA[Get the number of currently running map tasks in the cluster.
  170. @return the number of currently running map tasks in the cluster.]]>
  171. </doc>
  172. </method>
  173. <method name="getReduceTasks" return="int"
  174. abstract="false" native="false" synchronized="false"
  175. static="false" final="false" visibility="public"
  176. deprecated="not deprecated">
  177. <doc>
  178. <![CDATA[Get the number of currently running reduce tasks in the cluster.
  179. @return the number of currently running reduce tasks in the cluster.]]>
  180. </doc>
  181. </method>
  182. <method name="getMaxMapTasks" return="int"
  183. abstract="false" native="false" synchronized="false"
  184. static="false" final="false" visibility="public"
  185. deprecated="not deprecated">
  186. <doc>
  187. <![CDATA[Get the maximum capacity for running map tasks in the cluster.
  188. @return the maximum capacity for running map tasks in the cluster.]]>
  189. </doc>
  190. </method>
  191. <method name="getMaxReduceTasks" return="int"
  192. abstract="false" native="false" synchronized="false"
  193. static="false" final="false" visibility="public"
  194. deprecated="not deprecated">
  195. <doc>
  196. <![CDATA[Get the maximum capacity for running reduce tasks in the cluster.
  197. @return the maximum capacity for running reduce tasks in the cluster.]]>
  198. </doc>
  199. </method>
  200. <method name="getJobTrackerState" return="org.apache.hadoop.mapred.JobTracker.State"
  201. abstract="false" native="false" synchronized="false"
  202. static="false" final="false" visibility="public"
  203. deprecated="Use {@link #getJobTrackerStatus()} instead.">
  204. <doc>
  205. <![CDATA[Get the current state of the <code>JobTracker</code>,
  206. as {@link JobTracker.State}
  207. @return the current state of the <code>JobTracker</code>.
  208. @deprecated Use {@link #getJobTrackerStatus()} instead.]]>
  209. </doc>
  210. </method>
  211. <method name="getJobTrackerStatus" return="org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus"
  212. abstract="false" native="false" synchronized="false"
  213. static="false" final="false" visibility="public"
  214. deprecated="not deprecated">
  215. <doc>
  216. <![CDATA[Get the JobTracker's status.
  217. @return {@link JobTrackerStatus} of the JobTracker]]>
  218. </doc>
  219. </method>
  220. <method name="getBlackListedTrackersInfo" return="java.util.Collection"
  221. abstract="false" native="false" synchronized="false"
  222. static="false" final="false" visibility="public"
  223. deprecated="not deprecated">
  224. <doc>
  225. <![CDATA[Gets the list of blacklisted trackers along with reasons for blacklisting.
  226. @return the collection of {@link BlackListInfo} objects.]]>
  227. </doc>
  228. </method>
  229. <method name="write"
  230. abstract="false" native="false" synchronized="false"
  231. static="false" final="false" visibility="public"
  232. deprecated="not deprecated">
  233. <param name="out" type="java.io.DataOutput"/>
  234. <exception name="IOException" type="java.io.IOException"/>
  235. </method>
  236. <method name="readFields"
  237. abstract="false" native="false" synchronized="false"
  238. static="false" final="false" visibility="public"
  239. deprecated="not deprecated">
  240. <param name="in" type="java.io.DataInput"/>
  241. <exception name="IOException" type="java.io.IOException"/>
  242. </method>
  243. <doc>
  244. <![CDATA[Status information on the current state of the Map-Reduce cluster.
  245. <p><code>ClusterStatus</code> provides clients with information such as:
  246. <ol>
  247. <li>
  248. Size of the cluster.
  249. </li>
  250. <li>
  251. Name of the trackers.
  252. </li>
  253. <li>
  254. Task capacity of the cluster.
  255. </li>
  256. <li>
  257. The number of currently running map and reduce tasks.
  258. </li>
  259. <li>
  260. State of the <code>JobTracker</code>.
  261. </li>
  262. <li>
  263. Details regarding black listed trackers.
  264. </li>
  265. </ol></p>
  266. <p>Clients can query for the latest <code>ClusterStatus</code>, via
  267. {@link JobClient#getClusterStatus()}.</p>
  268. @see JobClient
  269. @deprecated Use {@link ClusterMetrics} or {@link TaskTrackerInfo} instead]]>
  270. </doc>
  271. </class>
  272. <!-- end class org.apache.hadoop.mapred.ClusterStatus -->
  273. <!-- start class org.apache.hadoop.mapred.ClusterStatus.BlackListInfo -->
  274. <class name="ClusterStatus.BlackListInfo" extends="java.lang.Object"
  275. abstract="false"
  276. static="true" final="false" visibility="public"
  277. deprecated="not deprecated">
  278. <implements name="org.apache.hadoop.io.Writable"/>
  279. <method name="getTrackerName" return="java.lang.String"
  280. abstract="false" native="false" synchronized="false"
  281. static="false" final="false" visibility="public"
  282. deprecated="not deprecated">
  283. <doc>
  284. <![CDATA[Gets the blacklisted tasktracker's name.
  285. @return tracker's name.]]>
  286. </doc>
  287. </method>
  288. <method name="getReasonForBlackListing" return="java.lang.String"
  289. abstract="false" native="false" synchronized="false"
  290. static="false" final="false" visibility="public"
  291. deprecated="not deprecated">
  292. <doc>
  293. <![CDATA[Gets the reason for which the tasktracker was blacklisted.
  294. @return the reason for which the tracker was blacklisted]]>
  295. </doc>
  296. </method>
  297. <method name="getBlackListReport" return="java.lang.String"
  298. abstract="false" native="false" synchronized="false"
  299. static="false" final="false" visibility="public"
  300. deprecated="not deprecated">
  301. <doc>
  302. <![CDATA[Gets a descriptive report about why the tasktracker was blacklisted.
  303. @return report describing why the tasktracker was blacklisted.]]>
  304. </doc>
  305. </method>
  306. <method name="readFields"
  307. abstract="false" native="false" synchronized="false"
  308. static="false" final="false" visibility="public"
  309. deprecated="not deprecated">
  310. <param name="in" type="java.io.DataInput"/>
  311. <exception name="IOException" type="java.io.IOException"/>
  312. </method>
  313. <method name="write"
  314. abstract="false" native="false" synchronized="false"
  315. static="false" final="false" visibility="public"
  316. deprecated="not deprecated">
  317. <param name="out" type="java.io.DataOutput"/>
  318. <exception name="IOException" type="java.io.IOException"/>
  319. </method>
  320. <method name="toString" return="java.lang.String"
  321. abstract="false" native="false" synchronized="false"
  322. static="false" final="false" visibility="public"
  323. deprecated="not deprecated">
  324. </method>
  325. <doc>
  326. <![CDATA[Class which encapsulates information about a blacklisted tasktracker.
  327. The information includes the tasktracker's name and reasons for
  328. getting blacklisted. The toString method of the class will print
  329. the information in a whitespace separated fashion to enable parsing.]]>
  330. </doc>
  331. </class>
  332. <!-- end class org.apache.hadoop.mapred.ClusterStatus.BlackListInfo -->
  333. <!-- start class org.apache.hadoop.mapred.Counters -->
  334. <class name="Counters" extends="java.lang.Object"
  335. abstract="false"
  336. static="false" final="false" visibility="public"
  337. deprecated="Use {@link org.apache.hadoop.mapreduce.Counters} instead.">
  338. <implements name="org.apache.hadoop.io.Writable"/>
  339. <implements name="java.lang.Iterable"/>
  340. <constructor name="Counters"
  341. static="false" final="false" visibility="public"
  342. deprecated="not deprecated">
  343. </constructor>
  344. <method name="getGroupNames" return="java.util.Collection"
  345. abstract="false" native="false" synchronized="true"
  346. static="false" final="false" visibility="public"
  347. deprecated="not deprecated">
  348. <doc>
  349. <![CDATA[Returns the names of all counter classes.
  350. @return the names of the counter groups.]]>
  351. </doc>
  352. </method>
  353. <method name="iterator" return="java.util.Iterator"
  354. abstract="false" native="false" synchronized="true"
  355. static="false" final="false" visibility="public"
  356. deprecated="not deprecated">
  357. </method>
  358. <method name="getGroup" return="org.apache.hadoop.mapred.Counters.Group"
  359. abstract="false" native="false" synchronized="true"
  360. static="false" final="false" visibility="public"
  361. deprecated="not deprecated">
  362. <param name="groupName" type="java.lang.String"/>
  363. <doc>
  364. <![CDATA[Returns the named counter group, or an empty group if there is none
  365. with the specified name.]]>
  366. </doc>
  367. </method>
  368. <method name="findCounter" return="org.apache.hadoop.mapred.Counters.Counter"
  369. abstract="false" native="false" synchronized="true"
  370. static="false" final="false" visibility="public"
  371. deprecated="not deprecated">
  372. <param name="key" type="java.lang.Enum"/>
  373. <doc>
  374. <![CDATA[Find the counter for the given enum. The same enum will always return the
  375. same counter.
  376. @param key the counter key
  377. @return the matching counter object]]>
  378. </doc>
  379. </method>
  380. <method name="findCounter" return="org.apache.hadoop.mapred.Counters.Counter"
  381. abstract="false" native="false" synchronized="true"
  382. static="false" final="false" visibility="public"
  383. deprecated="not deprecated">
  384. <param name="group" type="java.lang.String"/>
  385. <param name="name" type="java.lang.String"/>
  386. <doc>
  387. <![CDATA[Find a counter given the group and the name.
  388. @param group the name of the group
  389. @param name the internal name of the counter
  390. @return the counter for that name]]>
  391. </doc>
  392. </method>
  393. <method name="findCounter" return="org.apache.hadoop.mapred.Counters.Counter"
  394. abstract="false" native="false" synchronized="true"
  395. static="false" final="false" visibility="public"
  396. deprecated="deprecated, no comment">
  397. <param name="group" type="java.lang.String"/>
  398. <param name="id" type="int"/>
  399. <param name="name" type="java.lang.String"/>
  400. <doc>
  401. <![CDATA[Find a counter by using strings
  402. @param group the name of the group
  403. @param id the id of the counter within the group (0 to N-1)
  404. @param name the internal name of the counter
  405. @return the counter for that name
  406. @deprecated]]>
  407. </doc>
  408. </method>
  409. <method name="incrCounter"
  410. abstract="false" native="false" synchronized="true"
  411. static="false" final="false" visibility="public"
  412. deprecated="not deprecated">
  413. <param name="key" type="java.lang.Enum"/>
  414. <param name="amount" type="long"/>
  415. <doc>
  416. <![CDATA[Increments the specified counter by the specified amount, creating it if
  417. it didn't already exist.
  418. @param key identifies a counter
  419. @param amount amount by which counter is to be incremented]]>
  420. </doc>
  421. </method>
  422. <method name="incrCounter"
  423. abstract="false" native="false" synchronized="true"
  424. static="false" final="false" visibility="public"
  425. deprecated="not deprecated">
  426. <param name="group" type="java.lang.String"/>
  427. <param name="counter" type="java.lang.String"/>
  428. <param name="amount" type="long"/>
  429. <doc>
  430. <![CDATA[Increments the specified counter by the specified amount, creating it if
  431. it didn't already exist.
  432. @param group the name of the group
  433. @param counter the internal name of the counter
  434. @param amount amount by which counter is to be incremented]]>
  435. </doc>
  436. </method>
  437. <method name="getCounter" return="long"
  438. abstract="false" native="false" synchronized="true"
  439. static="false" final="false" visibility="public"
  440. deprecated="not deprecated">
  441. <param name="key" type="java.lang.Enum"/>
  442. <doc>
  443. <![CDATA[Returns current value of the specified counter, or 0 if the counter
  444. does not exist.]]>
  445. </doc>
  446. </method>
  447. <method name="incrAllCounters"
  448. abstract="false" native="false" synchronized="true"
  449. static="false" final="false" visibility="public"
  450. deprecated="not deprecated">
  451. <param name="other" type="org.apache.hadoop.mapred.Counters"/>
  452. <doc>
  453. <![CDATA[Increments multiple counters by their amounts in another Counters
  454. instance.
  455. @param other the other Counters instance]]>
  456. </doc>
  457. </method>
  458. <method name="sum" return="org.apache.hadoop.mapred.Counters"
  459. abstract="false" native="false" synchronized="false"
  460. static="true" final="false" visibility="public"
  461. deprecated="not deprecated">
  462. <param name="a" type="org.apache.hadoop.mapred.Counters"/>
  463. <param name="b" type="org.apache.hadoop.mapred.Counters"/>
  464. <doc>
  465. <![CDATA[Convenience method for computing the sum of two sets of counters.]]>
  466. </doc>
  467. </method>
  468. <method name="size" return="int"
  469. abstract="false" native="false" synchronized="true"
  470. static="false" final="false" visibility="public"
  471. deprecated="not deprecated">
  472. <doc>
  473. <![CDATA[Returns the total number of counters, by summing the number of counters
  474. in each group.]]>
  475. </doc>
  476. </method>
  477. <method name="write"
  478. abstract="false" native="false" synchronized="true"
  479. static="false" final="false" visibility="public"
  480. deprecated="not deprecated">
  481. <param name="out" type="java.io.DataOutput"/>
  482. <exception name="IOException" type="java.io.IOException"/>
  483. <doc>
  484. <![CDATA[Write the set of groups.
  485. The external format is:
  486. #groups (groupName group)*
  487. i.e. the number of groups followed by 0 or more groups, where each
  488. group is of the form:
  489. groupDisplayName #counters (false | true counter)*
  490. where each counter is of the form:
  491. name (false | true displayName) value]]>
  492. </doc>
  493. </method>
  494. <method name="readFields"
  495. abstract="false" native="false" synchronized="true"
  496. static="false" final="false" visibility="public"
  497. deprecated="not deprecated">
  498. <param name="in" type="java.io.DataInput"/>
  499. <exception name="IOException" type="java.io.IOException"/>
  500. <doc>
  501. <![CDATA[Read a set of groups.]]>
  502. </doc>
  503. </method>
  504. <method name="log"
  505. abstract="false" native="false" synchronized="false"
  506. static="false" final="false" visibility="public"
  507. deprecated="not deprecated">
  508. <param name="log" type="org.apache.commons.logging.Log"/>
  509. <doc>
  510. <![CDATA[Logs the current counter values.
  511. @param log The log to use.]]>
  512. </doc>
  513. </method>
  514. <method name="toString" return="java.lang.String"
  515. abstract="false" native="false" synchronized="true"
  516. static="false" final="false" visibility="public"
  517. deprecated="not deprecated">
  518. <doc>
  519. <![CDATA[Return textual representation of the counter values.]]>
  520. </doc>
  521. </method>
  522. <method name="makeCompactString" return="java.lang.String"
  523. abstract="false" native="false" synchronized="true"
  524. static="false" final="false" visibility="public"
  525. deprecated="not deprecated">
  526. <doc>
  527. <![CDATA[Convert a counters object into a single line that is easy to parse.
  528. @return the string with "name=value" for each counter and separated by ","]]>
  529. </doc>
  530. </method>
  531. <method name="makeEscapedCompactString" return="java.lang.String"
  532. abstract="false" native="false" synchronized="true"
  533. static="false" final="false" visibility="public"
  534. deprecated="not deprecated">
  535. <doc>
  536. <![CDATA[Represent the counter in a textual format that can be converted back to
  537. its object form
  538. @return the string in the following format
  539. {(groupname)(group-displayname)[(countername)(displayname)(value)][][]}{}{}]]>
  540. </doc>
  541. </method>
  542. <method name="fromEscapedCompactString" return="org.apache.hadoop.mapred.Counters"
  543. abstract="false" native="false" synchronized="false"
  544. static="true" final="false" visibility="public"
  545. deprecated="not deprecated">
  546. <param name="compactString" type="java.lang.String"/>
  547. <exception name="ParseException" type="java.text.ParseException"/>
  548. <doc>
  549. <![CDATA[Convert a stringified counters representation into a Counters object. Note
  550. that the counters can be recovered if they were stringified using
  551. {@link #makeEscapedCompactString()}.
  552. @return a Counters object]]>
  553. </doc>
  554. </method>
  555. <method name="hashCode" return="int"
  556. abstract="false" native="false" synchronized="true"
  557. static="false" final="false" visibility="public"
  558. deprecated="not deprecated">
  559. </method>
  560. <method name="equals" return="boolean"
  561. abstract="false" native="false" synchronized="true"
  562. static="false" final="false" visibility="public"
  563. deprecated="not deprecated">
  564. <param name="obj" type="java.lang.Object"/>
  565. </method>
  566. <doc>
  567. <![CDATA[A set of named counters.
  568. <p><code>Counters</code> represent global counters, defined either by the
  569. Map-Reduce framework or applications. Each <code>Counter</code> can be of
  570. any {@link Enum} type.</p>
  571. <p><code>Counters</code> are bunched into {@link Group}s, each comprising
  572. counters from a particular <code>Enum</code> class.</p>
  573. @deprecated Use {@link org.apache.hadoop.mapreduce.Counters} instead.]]>
  574. </doc>
  575. </class>
  576. <!-- end class org.apache.hadoop.mapred.Counters -->
  577. <!-- start class org.apache.hadoop.mapred.Counters.Counter -->
  578. <class name="Counters.Counter" extends="org.apache.hadoop.mapreduce.Counter"
  579. abstract="false"
  580. static="true" final="false" visibility="public"
  581. deprecated="not deprecated">
  582. <method name="setDisplayName"
  583. abstract="false" native="false" synchronized="false"
  584. static="false" final="false" visibility="public"
  585. deprecated="not deprecated">
  586. <param name="newName" type="java.lang.String"/>
  587. </method>
  588. <method name="makeEscapedCompactString" return="java.lang.String"
  589. abstract="false" native="false" synchronized="true"
  590. static="false" final="false" visibility="public"
  591. deprecated="not deprecated">
  592. <doc>
  593. <![CDATA[Returns the compact stringified version of the counter in the format
  594. [(actual-name)(display-name)(value)]]]>
  595. </doc>
  596. </method>
  597. <method name="getCounter" return="long"
  598. abstract="false" native="false" synchronized="true"
  599. static="false" final="false" visibility="public"
  600. deprecated="not deprecated">
  601. <doc>
  602. <![CDATA[What is the current value of this counter?
  603. @return the current value]]>
  604. </doc>
  605. </method>
  606. <doc>
  607. <![CDATA[A counter record, comprising its name and value.]]>
  608. </doc>
  609. </class>
  610. <!-- end class org.apache.hadoop.mapred.Counters.Counter -->
  611. <!-- start class org.apache.hadoop.mapred.Counters.Group -->
  612. <class name="Counters.Group" extends="java.lang.Object"
  613. abstract="false"
  614. static="true" final="false" visibility="public"
  615. deprecated="not deprecated">
  616. <implements name="org.apache.hadoop.io.Writable"/>
  617. <implements name="java.lang.Iterable"/>
  618. <method name="getName" return="java.lang.String"
  619. abstract="false" native="false" synchronized="false"
  620. static="false" final="false" visibility="public"
  621. deprecated="not deprecated">
  622. <doc>
  623. <![CDATA[Returns raw name of the group. This is the name of the enum class
  624. for this group of counters.]]>
  625. </doc>
  626. </method>
  627. <method name="getDisplayName" return="java.lang.String"
  628. abstract="false" native="false" synchronized="false"
  629. static="false" final="false" visibility="public"
  630. deprecated="not deprecated">
  631. <doc>
  632. <![CDATA[Returns localized name of the group. This is the same as getName() by
  633. default, but different if an appropriate ResourceBundle is found.]]>
  634. </doc>
  635. </method>
  636. <method name="setDisplayName"
  637. abstract="false" native="false" synchronized="false"
  638. static="false" final="false" visibility="public"
  639. deprecated="not deprecated">
  640. <param name="displayName" type="java.lang.String"/>
  641. <doc>
  642. <![CDATA[Set the display name]]>
  643. </doc>
  644. </method>
  645. <method name="makeEscapedCompactString" return="java.lang.String"
  646. abstract="false" native="false" synchronized="false"
  647. static="false" final="false" visibility="public"
  648. deprecated="not deprecated">
  649. <doc>
  650. <![CDATA[Returns the compact stringified version of the group in the format
  651. {(actual-name)(display-name)[][][]} where [] are compact strings for the
  652. counters within.]]>
  653. </doc>
  654. </method>
  655. <method name="hashCode" return="int"
  656. abstract="false" native="false" synchronized="false"
  657. static="false" final="false" visibility="public"
  658. deprecated="not deprecated">
  659. </method>
  660. <method name="equals" return="boolean"
  661. abstract="false" native="false" synchronized="true"
  662. static="false" final="false" visibility="public"
  663. deprecated="not deprecated">
  664. <param name="obj" type="java.lang.Object"/>
  665. <doc>
  666. <![CDATA[Checks for (content) equality of Groups]]>
  667. </doc>
  668. </method>
  669. <method name="getCounter" return="long"
  670. abstract="false" native="false" synchronized="true"
  671. static="false" final="false" visibility="public"
  672. deprecated="not deprecated">
  673. <param name="counterName" type="java.lang.String"/>
  674. <doc>
  675. <![CDATA[Returns the value of the specified counter, or 0 if the counter does
  676. not exist.]]>
  677. </doc>
  678. </method>
  679. <method name="getCounter" return="org.apache.hadoop.mapred.Counters.Counter"
  680. abstract="false" native="false" synchronized="true"
  681. static="false" final="false" visibility="public"
  682. deprecated="use {@link #getCounter(String)} instead">
  683. <param name="id" type="int"/>
  684. <param name="name" type="java.lang.String"/>
  685. <doc>
  686. <![CDATA[Get the counter for the given id and create it if it doesn't exist.
  687. @param id the numeric id of the counter within the group
  688. @param name the internal counter name
  689. @return the counter
  690. @deprecated use {@link #getCounter(String)} instead]]>
  691. </doc>
  692. </method>
  693. <method name="getCounterForName" return="org.apache.hadoop.mapred.Counters.Counter"
  694. abstract="false" native="false" synchronized="true"
  695. static="false" final="false" visibility="public"
  696. deprecated="not deprecated">
  697. <param name="name" type="java.lang.String"/>
  698. <doc>
  699. <![CDATA[Get the counter for the given name and create it if it doesn't exist.
  700. @param name the internal counter name
  701. @return the counter]]>
  702. </doc>
  703. </method>
  704. <method name="size" return="int"
  705. abstract="false" native="false" synchronized="true"
  706. static="false" final="false" visibility="public"
  707. deprecated="not deprecated">
  708. <doc>
  709. <![CDATA[Returns the number of counters in this group.]]>
  710. </doc>
  711. </method>
  712. <method name="write"
  713. abstract="false" native="false" synchronized="true"
  714. static="false" final="false" visibility="public"
  715. deprecated="not deprecated">
  716. <param name="out" type="java.io.DataOutput"/>
  717. <exception name="IOException" type="java.io.IOException"/>
  718. </method>
  719. <method name="readFields"
  720. abstract="false" native="false" synchronized="true"
  721. static="false" final="false" visibility="public"
  722. deprecated="not deprecated">
  723. <param name="in" type="java.io.DataInput"/>
  724. <exception name="IOException" type="java.io.IOException"/>
  725. </method>
  726. <method name="iterator" return="java.util.Iterator"
  727. abstract="false" native="false" synchronized="true"
  728. static="false" final="false" visibility="public"
  729. deprecated="not deprecated">
  730. </method>
  731. <doc>
  732. <![CDATA[<code>Group</code> of counters, comprising counters from a particular
  733. counter {@link Enum} class.
  734. <p><code>Group</code> handles localization of the class name and the
  735. counter names.</p>]]>
  736. </doc>
  737. </class>
  738. <!-- end class org.apache.hadoop.mapred.Counters.Group -->
  739. <!-- start class org.apache.hadoop.mapred.FileAlreadyExistsException -->
  740. <class name="FileAlreadyExistsException" extends="java.io.IOException"
  741. abstract="false"
  742. static="false" final="false" visibility="public"
  743. deprecated="not deprecated">
  744. <constructor name="FileAlreadyExistsException"
  745. static="false" final="false" visibility="public"
  746. deprecated="not deprecated">
  747. </constructor>
  748. <constructor name="FileAlreadyExistsException" type="java.lang.String"
  749. static="false" final="false" visibility="public"
  750. deprecated="not deprecated">
  751. </constructor>
  752. <doc>
  753. <![CDATA[Used when target file already exists for any operation and
  754. is not configured to be overwritten.]]>
  755. </doc>
  756. </class>
  757. <!-- end class org.apache.hadoop.mapred.FileAlreadyExistsException -->
  758. <!-- start class org.apache.hadoop.mapred.FileInputFormat -->
  759. <class name="FileInputFormat" extends="java.lang.Object"
  760. abstract="true"
  761. static="false" final="false" visibility="public"
  762. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.input.FileInputFormat}
  763. instead.">
  764. <implements name="org.apache.hadoop.mapred.InputFormat"/>
  765. <constructor name="FileInputFormat"
  766. static="false" final="false" visibility="public"
  767. deprecated="not deprecated">
  768. </constructor>
  769. <method name="setMinSplitSize"
  770. abstract="false" native="false" synchronized="false"
  771. static="false" final="false" visibility="protected"
  772. deprecated="not deprecated">
  773. <param name="minSplitSize" type="long"/>
  774. </method>
  775. <method name="isSplitable" return="boolean"
  776. abstract="false" native="false" synchronized="false"
  777. static="false" final="false" visibility="protected"
  778. deprecated="not deprecated">
  779. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  780. <param name="filename" type="org.apache.hadoop.fs.Path"/>
  781. <doc>
  782. <![CDATA[Is the given filename splitable? Usually, true, but if the file is
  783. stream compressed, it will not be.
  784. <code>FileInputFormat</code> implementations can override this and return
  785. <code>false</code> to ensure that individual input files are never split-up
  786. so that {@link Mapper}s process entire files.
  787. @param fs the file system that the file is on
  788. @param filename the file name to check
  789. @return is this file splitable?]]>
  790. </doc>
  791. </method>
  792. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  793. abstract="true" native="false" synchronized="false"
  794. static="false" final="false" visibility="public"
  795. deprecated="not deprecated">
  796. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  797. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  798. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  799. <exception name="IOException" type="java.io.IOException"/>
  800. </method>
  801. <method name="setInputPathFilter"
  802. abstract="false" native="false" synchronized="false"
  803. static="true" final="false" visibility="public"
  804. deprecated="not deprecated">
  805. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  806. <param name="filter" type="java.lang.Class"/>
  807. <doc>
  808. <![CDATA[Set a PathFilter to be applied to the input paths for the map-reduce job.
  809. @param filter the PathFilter class to use for filtering the input paths.]]>
  810. </doc>
  811. </method>
  812. <method name="getInputPathFilter" return="org.apache.hadoop.fs.PathFilter"
  813. abstract="false" native="false" synchronized="false"
  814. static="true" final="false" visibility="public"
  815. deprecated="not deprecated">
  816. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  817. <doc>
  818. <![CDATA[Get a PathFilter instance of the filter set for the input paths.
  819. @return the PathFilter instance set for the job, NULL if none has been set.]]>
  820. </doc>
  821. </method>
  822. <method name="addInputPathRecursively"
  823. abstract="false" native="false" synchronized="false"
  824. static="false" final="false" visibility="protected"
  825. deprecated="not deprecated">
  826. <param name="result" type="java.util.List"/>
  827. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  828. <param name="path" type="org.apache.hadoop.fs.Path"/>
  829. <param name="inputFilter" type="org.apache.hadoop.fs.PathFilter"/>
  830. <exception name="IOException" type="java.io.IOException"/>
  831. <doc>
  832. <![CDATA[Add files in the input path recursively into the results.
  833. @param result
  834. The List to store all files.
  835. @param fs
  836. The FileSystem.
  837. @param path
  838. The input path.
  839. @param inputFilter
  840. The input filter that can be used to filter files/dirs.
  841. @throws IOException]]>
  842. </doc>
  843. </method>
  844. <method name="listStatus" return="org.apache.hadoop.fs.FileStatus[]"
  845. abstract="false" native="false" synchronized="false"
  846. static="false" final="false" visibility="protected"
  847. deprecated="not deprecated">
  848. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  849. <exception name="IOException" type="java.io.IOException"/>
  850. <doc>
  851. <![CDATA[List input directories.
  852. Subclasses may override to, e.g., select only files matching a regular
  853. expression.
  854. @param job the job to list input paths for
  855. @return array of FileStatus objects
  856. @throws IOException if zero items.]]>
  857. </doc>
  858. </method>
  859. <method name="makeSplit" return="org.apache.hadoop.mapred.FileSplit"
  860. abstract="false" native="false" synchronized="false"
  861. static="false" final="false" visibility="protected"
  862. deprecated="not deprecated">
  863. <param name="file" type="org.apache.hadoop.fs.Path"/>
  864. <param name="start" type="long"/>
  865. <param name="length" type="long"/>
  866. <param name="hosts" type="java.lang.String[]"/>
  867. <doc>
  868. <![CDATA[A factory that makes the split for this class. It can be overridden
  869. by sub-classes to make sub-types]]>
  870. </doc>
  871. </method>
  872. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  873. abstract="false" native="false" synchronized="false"
  874. static="false" final="false" visibility="public"
  875. deprecated="not deprecated">
  876. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  877. <param name="numSplits" type="int"/>
  878. <exception name="IOException" type="java.io.IOException"/>
  879. <doc>
  880. <![CDATA[Splits files returned by {@link #listStatus(JobConf)} when
  881. they're too big.]]>
  882. </doc>
  883. </method>
  884. <method name="computeSplitSize" return="long"
  885. abstract="false" native="false" synchronized="false"
  886. static="false" final="false" visibility="protected"
  887. deprecated="not deprecated">
  888. <param name="goalSize" type="long"/>
  889. <param name="minSize" type="long"/>
  890. <param name="blockSize" type="long"/>
  891. </method>
  892. <method name="getBlockIndex" return="int"
  893. abstract="false" native="false" synchronized="false"
  894. static="false" final="false" visibility="protected"
  895. deprecated="not deprecated">
  896. <param name="blkLocations" type="org.apache.hadoop.fs.BlockLocation[]"/>
  897. <param name="offset" type="long"/>
  898. </method>
  899. <method name="setInputPaths"
  900. abstract="false" native="false" synchronized="false"
  901. static="true" final="false" visibility="public"
  902. deprecated="not deprecated">
  903. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  904. <param name="commaSeparatedPaths" type="java.lang.String"/>
  905. <doc>
  906. <![CDATA[Sets the given comma separated paths as the list of inputs
  907. for the map-reduce job.
  908. @param conf Configuration of the job
  909. @param commaSeparatedPaths Comma separated paths to be set as
  910. the list of inputs for the map-reduce job.]]>
  911. </doc>
  912. </method>
  913. <method name="addInputPaths"
  914. abstract="false" native="false" synchronized="false"
  915. static="true" final="false" visibility="public"
  916. deprecated="not deprecated">
  917. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  918. <param name="commaSeparatedPaths" type="java.lang.String"/>
  919. <doc>
  920. <![CDATA[Add the given comma separated paths to the list of inputs for
  921. the map-reduce job.
  922. @param conf The configuration of the job
  923. @param commaSeparatedPaths Comma separated paths to be added to
  924. the list of inputs for the map-reduce job.]]>
  925. </doc>
  926. </method>
  927. <method name="setInputPaths"
  928. abstract="false" native="false" synchronized="false"
  929. static="true" final="false" visibility="public"
  930. deprecated="not deprecated">
  931. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  932. <param name="inputPaths" type="org.apache.hadoop.fs.Path[]"/>
  933. <doc>
  934. <![CDATA[Set the array of {@link Path}s as the list of inputs
  935. for the map-reduce job.
  936. @param conf Configuration of the job.
  937. @param inputPaths the {@link Path}s of the input directories/files
  938. for the map-reduce job.]]>
  939. </doc>
  940. </method>
  941. <method name="addInputPath"
  942. abstract="false" native="false" synchronized="false"
  943. static="true" final="false" visibility="public"
  944. deprecated="not deprecated">
  945. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  946. <param name="path" type="org.apache.hadoop.fs.Path"/>
  947. <doc>
  948. <![CDATA[Add a {@link Path} to the list of inputs for the map-reduce job.
  949. @param conf The configuration of the job
  950. @param path {@link Path} to be added to the list of inputs for
  951. the map-reduce job.]]>
  952. </doc>
  953. </method>
  954. <method name="getInputPaths" return="org.apache.hadoop.fs.Path[]"
  955. abstract="false" native="false" synchronized="false"
  956. static="true" final="false" visibility="public"
  957. deprecated="not deprecated">
  958. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  959. <doc>
  960. <![CDATA[Get the list of input {@link Path}s for the map-reduce job.
  961. @param conf The configuration of the job
  962. @return the list of input {@link Path}s for the map-reduce job.]]>
  963. </doc>
  964. </method>
  965. <method name="getSplitHosts" return="java.lang.String[]"
  966. abstract="false" native="false" synchronized="false"
  967. static="false" final="false" visibility="protected"
  968. deprecated="not deprecated">
  969. <param name="blkLocations" type="org.apache.hadoop.fs.BlockLocation[]"/>
  970. <param name="offset" type="long"/>
  971. <param name="splitSize" type="long"/>
  972. <param name="clusterMap" type="org.apache.hadoop.net.NetworkTopology"/>
  973. <exception name="IOException" type="java.io.IOException"/>
  974. <doc>
  975. <![CDATA[This function identifies and returns the hosts that contribute
  976. most for a given split. For calculating the contribution, rack
  977. locality is treated on par with host locality, so hosts from racks
  978. that contribute the most are preferred over hosts on racks that
  979. contribute less
  980. @param blkLocations The list of block locations
  981. @param offset
  982. @param splitSize
  983. @return array of hosts that contribute most to this split
  984. @throws IOException]]>
  985. </doc>
  986. </method>
  987. <field name="LOG" type="org.apache.commons.logging.Log"
  988. transient="false" volatile="false"
  989. static="true" final="true" visibility="public"
  990. deprecated="not deprecated">
  991. </field>
  992. <field name="NUM_INPUT_FILES" type="java.lang.String"
  993. transient="false" volatile="false"
  994. static="true" final="true" visibility="public"
  995. deprecated="not deprecated">
  996. </field>
  997. <doc>
  998. <![CDATA[A base class for file-based {@link InputFormat}.
  999. <p><code>FileInputFormat</code> is the base class for all file-based
  1000. <code>InputFormat</code>s. This provides a generic implementation of
  1001. {@link #getSplits(JobConf, int)}.
  1002. Subclasses of <code>FileInputFormat</code> can also override the
  1003. {@link #isSplitable(FileSystem, Path)} method to ensure input-files are
  1004. not split-up and are processed as a whole by {@link Mapper}s.
  1005. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.input.FileInputFormat}
  1006. instead.]]>
  1007. </doc>
  1008. </class>
  1009. <!-- end class org.apache.hadoop.mapred.FileInputFormat -->
  1010. <!-- start class org.apache.hadoop.mapred.FileOutputCommitter -->
  1011. <class name="FileOutputCommitter" extends="org.apache.hadoop.mapred.OutputCommitter"
  1012. abstract="false"
  1013. static="false" final="false" visibility="public"
  1014. deprecated="not deprecated">
  1015. <constructor name="FileOutputCommitter"
  1016. static="false" final="false" visibility="public"
  1017. deprecated="not deprecated">
  1018. </constructor>
  1019. <method name="setupJob"
  1020. abstract="false" native="false" synchronized="false"
  1021. static="false" final="false" visibility="public"
  1022. deprecated="not deprecated">
  1023. <param name="context" type="org.apache.hadoop.mapred.JobContext"/>
  1024. <exception name="IOException" type="java.io.IOException"/>
  1025. </method>
  1026. <method name="commitJob"
  1027. abstract="false" native="false" synchronized="false"
  1028. static="false" final="false" visibility="public"
  1029. deprecated="not deprecated">
  1030. <param name="context" type="org.apache.hadoop.mapred.JobContext"/>
  1031. <exception name="IOException" type="java.io.IOException"/>
  1032. </method>
  1033. <method name="cleanupJob"
  1034. abstract="false" native="false" synchronized="false"
  1035. static="false" final="false" visibility="public"
  1036. deprecated="not deprecated">
  1037. <param name="context" type="org.apache.hadoop.mapred.JobContext"/>
  1038. <exception name="IOException" type="java.io.IOException"/>
  1039. </method>
  1040. <method name="abortJob"
  1041. abstract="false" native="false" synchronized="false"
  1042. static="false" final="false" visibility="public"
  1043. deprecated="not deprecated">
  1044. <param name="context" type="org.apache.hadoop.mapred.JobContext"/>
  1045. <param name="runState" type="int"/>
  1046. <exception name="IOException" type="java.io.IOException"/>
  1047. </method>
  1048. <method name="setupTask"
  1049. abstract="false" native="false" synchronized="false"
  1050. static="false" final="false" visibility="public"
  1051. deprecated="not deprecated">
  1052. <param name="context" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  1053. <exception name="IOException" type="java.io.IOException"/>
  1054. </method>
  1055. <method name="commitTask"
  1056. abstract="false" native="false" synchronized="false"
  1057. static="false" final="false" visibility="public"
  1058. deprecated="not deprecated">
  1059. <param name="context" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  1060. <exception name="IOException" type="java.io.IOException"/>
  1061. </method>
  1062. <method name="abortTask"
  1063. abstract="false" native="false" synchronized="false"
  1064. static="false" final="false" visibility="public"
  1065. deprecated="not deprecated">
  1066. <param name="context" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  1067. <exception name="IOException" type="java.io.IOException"/>
  1068. </method>
  1069. <method name="needsTaskCommit" return="boolean"
  1070. abstract="false" native="false" synchronized="false"
  1071. static="false" final="false" visibility="public"
  1072. deprecated="not deprecated">
  1073. <param name="context" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  1074. <exception name="IOException" type="java.io.IOException"/>
  1075. </method>
  1076. <field name="LOG" type="org.apache.commons.logging.Log"
  1077. transient="false" volatile="false"
  1078. static="true" final="true" visibility="public"
  1079. deprecated="not deprecated">
  1080. </field>
  1081. <field name="TEMP_DIR_NAME" type="java.lang.String"
  1082. transient="false" volatile="false"
  1083. static="true" final="true" visibility="public"
  1084. deprecated="not deprecated">
  1085. <doc>
  1086. <![CDATA[Temporary directory name]]>
  1087. </doc>
  1088. </field>
  1089. <field name="SUCCEEDED_FILE_NAME" type="java.lang.String"
  1090. transient="false" volatile="false"
  1091. static="true" final="true" visibility="public"
  1092. deprecated="not deprecated">
  1093. </field>
  1094. <doc>
  1095. <![CDATA[An {@link OutputCommitter} that commits files specified
  1096. in job output directory i.e. ${mapreduce.output.fileoutputformat.outputdir}.]]>
  1097. </doc>
  1098. </class>
  1099. <!-- end class org.apache.hadoop.mapred.FileOutputCommitter -->
  1100. <!-- start class org.apache.hadoop.mapred.FileOutputFormat -->
  1101. <class name="FileOutputFormat" extends="java.lang.Object"
  1102. abstract="true"
  1103. static="false" final="false" visibility="public"
  1104. deprecated="not deprecated">
  1105. <implements name="org.apache.hadoop.mapred.OutputFormat"/>
  1106. <constructor name="FileOutputFormat"
  1107. static="false" final="false" visibility="public"
  1108. deprecated="not deprecated">
  1109. </constructor>
  1110. <method name="setCompressOutput"
  1111. abstract="false" native="false" synchronized="false"
  1112. static="true" final="false" visibility="public"
  1113. deprecated="not deprecated">
  1114. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1115. <param name="compress" type="boolean"/>
  1116. <doc>
  1117. <![CDATA[Set whether the output of the job is compressed.
  1118. @param conf the {@link JobConf} to modify
  1119. @param compress should the output of the job be compressed?]]>
  1120. </doc>
  1121. </method>
  1122. <method name="getCompressOutput" return="boolean"
  1123. abstract="false" native="false" synchronized="false"
  1124. static="true" final="false" visibility="public"
  1125. deprecated="not deprecated">
  1126. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1127. <doc>
  1128. <![CDATA[Is the job output compressed?
  1129. @param conf the {@link JobConf} to look in
  1130. @return <code>true</code> if the job output should be compressed,
  1131. <code>false</code> otherwise]]>
  1132. </doc>
  1133. </method>
  1134. <method name="setOutputCompressorClass"
  1135. abstract="false" native="false" synchronized="false"
  1136. static="true" final="false" visibility="public"
  1137. deprecated="not deprecated">
  1138. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1139. <param name="codecClass" type="java.lang.Class"/>
  1140. <doc>
  1141. <![CDATA[Set the {@link CompressionCodec} to be used to compress job outputs.
  1142. @param conf the {@link JobConf} to modify
  1143. @param codecClass the {@link CompressionCodec} to be used to
  1144. compress the job outputs]]>
  1145. </doc>
  1146. </method>
  1147. <method name="getOutputCompressorClass" return="java.lang.Class"
  1148. abstract="false" native="false" synchronized="false"
  1149. static="true" final="false" visibility="public"
  1150. deprecated="not deprecated">
  1151. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1152. <param name="defaultValue" type="java.lang.Class"/>
  1153. <doc>
  1154. <![CDATA[Get the {@link CompressionCodec} for compressing the job outputs.
  1155. @param conf the {@link JobConf} to look in
  1156. @param defaultValue the {@link CompressionCodec} to return if not set
  1157. @return the {@link CompressionCodec} to be used to compress the
  1158. job outputs
  1159. @throws IllegalArgumentException if the class was specified, but not found]]>
  1160. </doc>
  1161. </method>
  1162. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  1163. abstract="true" native="false" synchronized="false"
  1164. static="false" final="false" visibility="public"
  1165. deprecated="not deprecated">
  1166. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  1167. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  1168. <param name="name" type="java.lang.String"/>
  1169. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  1170. <exception name="IOException" type="java.io.IOException"/>
  1171. </method>
  1172. <method name="checkOutputSpecs"
  1173. abstract="false" native="false" synchronized="false"
  1174. static="false" final="false" visibility="public"
  1175. deprecated="not deprecated">
  1176. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  1177. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  1178. <exception name="FileAlreadyExistsException" type="org.apache.hadoop.mapred.FileAlreadyExistsException"/>
  1179. <exception name="InvalidJobConfException" type="org.apache.hadoop.mapred.InvalidJobConfException"/>
  1180. <exception name="IOException" type="java.io.IOException"/>
  1181. </method>
  1182. <method name="setOutputPath"
  1183. abstract="false" native="false" synchronized="false"
  1184. static="true" final="false" visibility="public"
  1185. deprecated="not deprecated">
  1186. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1187. <param name="outputDir" type="org.apache.hadoop.fs.Path"/>
  1188. <doc>
  1189. <![CDATA[Set the {@link Path} of the output directory for the map-reduce job.
  1190. @param conf The configuration of the job.
  1191. @param outputDir the {@link Path} of the output directory for
  1192. the map-reduce job.]]>
  1193. </doc>
  1194. </method>
  1195. <method name="getOutputPath" return="org.apache.hadoop.fs.Path"
  1196. abstract="false" native="false" synchronized="false"
  1197. static="true" final="false" visibility="public"
  1198. deprecated="not deprecated">
  1199. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1200. <doc>
  1201. <![CDATA[Get the {@link Path} to the output directory for the map-reduce job.
  1202. @return the {@link Path} to the output directory for the map-reduce job.
  1203. @see FileOutputFormat#getWorkOutputPath(JobConf)]]>
  1204. </doc>
  1205. </method>
  1206. <method name="getWorkOutputPath" return="org.apache.hadoop.fs.Path"
  1207. abstract="false" native="false" synchronized="false"
  1208. static="true" final="false" visibility="public"
  1209. deprecated="not deprecated">
  1210. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1211. <doc>
  1212. <![CDATA[Get the {@link Path} to the task's temporary output directory
  1213. for the map-reduce job
  1214. <h4 id="SideEffectFiles">Tasks' Side-Effect Files</h4>
  1215. <p><i>Note:</i> The following is valid only if the {@link OutputCommitter}
  1216. is {@link FileOutputCommitter}. If <code>OutputCommitter</code> is not
  1217. a <code>FileOutputCommitter</code>, the task's temporary output
  1218. directory is the same as {@link #getOutputPath(JobConf)} i.e.
  1219. <tt>${mapreduce.output.fileoutputformat.outputdir}</tt></p>
  1220. <p>Some applications need to create/write-to side-files, which differ from
  1221. the actual job-outputs.</p>
  1222. <p>In such cases there could be issues with 2 instances of the same TIP
  1223. (running simultaneously e.g. speculative tasks) trying to open/write-to the
  1224. same file (path) on HDFS. Hence the application-writer will have to pick
  1225. unique names per task-attempt (e.g. using the attemptid, say
  1226. <tt>attempt_200709221812_0001_m_000000_0</tt>), not just per TIP.</p>
  1227. <p>To get around this the Map-Reduce framework helps the application-writer
  1228. out by maintaining a special
  1229. <tt>${mapreduce.output.fileoutputformat.outputdir}/_temporary/_${taskid}</tt>
  1230. sub-directory for each task-attempt on HDFS where the output of the
  1231. task-attempt goes. On successful completion of the task-attempt the files
  1232. in the <tt>${mapreduce.output.fileoutputformat.outputdir}/_temporary/_${taskid}</tt> (only)
  1233. are <i>promoted</i> to <tt>${mapreduce.output.fileoutputformat.outputdir}</tt>. Of course, the
  1234. framework discards the sub-directory of unsuccessful task-attempts. This
  1235. is completely transparent to the application.</p>
  1236. <p>The application-writer can take advantage of this by creating any
  1237. side-files required in <tt>${mapreduce.task.output.dir}</tt> during execution
  1238. of the reduce-task i.e. via {@link #getWorkOutputPath(JobConf)}, and the
  1239. framework will move them out similarly - thus the application-writer doesn't have to pick
  1240. unique paths per task-attempt.</p>
  1241. <p><i>Note</i>: the value of <tt>${mapreduce.task.output.dir}</tt> during
  1242. execution of a particular task-attempt is actually
  1243. <tt>${mapreduce.output.fileoutputformat.outputdir}/_temporary/_${taskid}</tt>, and this value is
  1244. set by the map-reduce framework. So, just create any side-files in the
  1245. path returned by {@link #getWorkOutputPath(JobConf)} from map/reduce
  1246. task to take advantage of this feature.</p>
  1247. <p>The entire discussion holds true for maps of jobs with
  1248. reducer=NONE (i.e. 0 reduces) since output of the map, in that case,
  1249. goes directly to HDFS.</p>
  1250. @return the {@link Path} to the task's temporary output directory
  1251. for the map-reduce job.]]>
  1252. </doc>
  1253. </method>
  1254. <method name="getTaskOutputPath" return="org.apache.hadoop.fs.Path"
  1255. abstract="false" native="false" synchronized="false"
  1256. static="true" final="false" visibility="public"
  1257. deprecated="not deprecated">
  1258. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1259. <param name="name" type="java.lang.String"/>
  1260. <exception name="IOException" type="java.io.IOException"/>
  1261. <doc>
  1262. <![CDATA[Helper function to create the task's temporary output directory and
  1263. return the path to the task's output file.
  1264. @param conf job-configuration
  1265. @param name temporary task-output filename
  1266. @return path to the task's temporary output file
  1267. @throws IOException]]>
  1268. </doc>
  1269. </method>
  1270. <method name="getUniqueName" return="java.lang.String"
  1271. abstract="false" native="false" synchronized="false"
  1272. static="true" final="false" visibility="public"
  1273. deprecated="not deprecated">
  1274. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1275. <param name="name" type="java.lang.String"/>
  1276. <doc>
  1277. <![CDATA[Helper function to generate a name that is unique for the task.
  1278. <p>The generated name can be used to create custom files from within the
  1279. different tasks for the job, the names for different tasks will not collide
  1280. with each other.</p>
  1281. <p>The given name is postfixed with the task type, 'm' for maps, 'r' for
  1282. reduces and the task partition number. For example, given a name 'test'
  1283. running on the first map of the job, the generated name will be
  1284. 'test-m-00000'.</p>
  1285. @param conf the configuration for the job.
  1286. @param name the name to make unique.
  1287. @return a unique name across all tasks of the job.]]>
  1288. </doc>
  1289. </method>
  1290. <method name="getPathForCustomFile" return="org.apache.hadoop.fs.Path"
  1291. abstract="false" native="false" synchronized="false"
  1292. static="true" final="false" visibility="public"
  1293. deprecated="not deprecated">
  1294. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1295. <param name="name" type="java.lang.String"/>
  1296. <doc>
  1297. <![CDATA[Helper function to generate a {@link Path} for a file that is unique for
  1298. the task within the job output directory.
  1299. <p>The path can be used to create custom files from within the map and
  1300. reduce tasks. The path name will be unique for each task. The path parent
  1301. will be the job output directory.</p>
  1302. <p>This method uses the {@link #getUniqueName} method to make the file name
  1303. unique for the task.</p>
  1304. @param conf the configuration for the job.
  1305. @param name the name for the file.
  1306. @return a unique path across all tasks of the job.]]>
  1307. </doc>
  1308. </method>
  1309. <doc>
  1310. <![CDATA[A base class for {@link OutputFormat}.]]>
  1311. </doc>
  1312. </class>
  1313. <!-- end class org.apache.hadoop.mapred.FileOutputFormat -->
  1314. <!-- start class org.apache.hadoop.mapred.FileSplit -->
  1315. <class name="FileSplit" extends="org.apache.hadoop.mapreduce.InputSplit"
  1316. abstract="false"
  1317. static="false" final="false" visibility="public"
  1318. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.input.FileSplit}
  1319. instead.">
  1320. <implements name="org.apache.hadoop.mapred.InputSplit"/>
  1321. <constructor name="FileSplit"
  1322. static="false" final="false" visibility="protected"
  1323. deprecated="not deprecated">
  1324. </constructor>
  1325. <constructor name="FileSplit" type="org.apache.hadoop.fs.Path, long, long, org.apache.hadoop.mapred.JobConf"
  1326. static="false" final="false" visibility="public"
  1327. deprecated="deprecated, no comment">
  1328. <doc>
  1329. <![CDATA[Constructs a split.
  1330. @deprecated
  1331. @param file the file name
  1332. @param start the position of the first byte in the file to process
  1333. @param length the number of bytes in the file to process]]>
  1334. </doc>
  1335. </constructor>
  1336. <constructor name="FileSplit" type="org.apache.hadoop.fs.Path, long, long, java.lang.String[]"
  1337. static="false" final="false" visibility="public"
  1338. deprecated="not deprecated">
  1339. <doc>
  1340. <![CDATA[Constructs a split with host information
  1341. @param file the file name
  1342. @param start the position of the first byte in the file to process
  1343. @param length the number of bytes in the file to process
  1344. @param hosts the list of hosts containing the block, possibly null]]>
  1345. </doc>
  1346. </constructor>
  1347. <constructor name="FileSplit" type="org.apache.hadoop.mapreduce.lib.input.FileSplit"
  1348. static="false" final="false" visibility="public"
  1349. deprecated="not deprecated">
  1350. </constructor>
  1351. <method name="getPath" return="org.apache.hadoop.fs.Path"
  1352. abstract="false" native="false" synchronized="false"
  1353. static="false" final="false" visibility="public"
  1354. deprecated="not deprecated">
  1355. <doc>
  1356. <![CDATA[The file containing this split's data.]]>
  1357. </doc>
  1358. </method>
  1359. <method name="getStart" return="long"
  1360. abstract="false" native="false" synchronized="false"
  1361. static="false" final="false" visibility="public"
  1362. deprecated="not deprecated">
  1363. <doc>
  1364. <![CDATA[The position of the first byte in the file to process.]]>
  1365. </doc>
  1366. </method>
  1367. <method name="getLength" return="long"
  1368. abstract="false" native="false" synchronized="false"
  1369. static="false" final="false" visibility="public"
  1370. deprecated="not deprecated">
  1371. <doc>
  1372. <![CDATA[The number of bytes in the file to process.]]>
  1373. </doc>
  1374. </method>
  1375. <method name="toString" return="java.lang.String"
  1376. abstract="false" native="false" synchronized="false"
  1377. static="false" final="false" visibility="public"
  1378. deprecated="not deprecated">
  1379. </method>
  1380. <method name="write"
  1381. abstract="false" native="false" synchronized="false"
  1382. static="false" final="false" visibility="public"
  1383. deprecated="not deprecated">
  1384. <param name="out" type="java.io.DataOutput"/>
  1385. <exception name="IOException" type="java.io.IOException"/>
  1386. </method>
  1387. <method name="readFields"
  1388. abstract="false" native="false" synchronized="false"
  1389. static="false" final="false" visibility="public"
  1390. deprecated="not deprecated">
  1391. <param name="in" type="java.io.DataInput"/>
  1392. <exception name="IOException" type="java.io.IOException"/>
  1393. </method>
  1394. <method name="getLocations" return="java.lang.String[]"
  1395. abstract="false" native="false" synchronized="false"
  1396. static="false" final="false" visibility="public"
  1397. deprecated="not deprecated">
  1398. <exception name="IOException" type="java.io.IOException"/>
  1399. </method>
  1400. <doc>
  1401. <![CDATA[A section of an input file. Returned by {@link
  1402. InputFormat#getSplits(JobConf, int)} and passed to
  1403. {@link InputFormat#getRecordReader(InputSplit,JobConf,Reporter)}.
  1404. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.input.FileSplit}
  1405. instead.]]>
  1406. </doc>
  1407. </class>
  1408. <!-- end class org.apache.hadoop.mapred.FileSplit -->
  1409. <!-- start class org.apache.hadoop.mapred.ID -->
  1410. <class name="ID" extends="org.apache.hadoop.mapreduce.ID"
  1411. abstract="true"
  1412. static="false" final="false" visibility="public"
  1413. deprecated="not deprecated">
  1414. <constructor name="ID" type="int"
  1415. static="false" final="false" visibility="public"
  1416. deprecated="not deprecated">
  1417. <doc>
  1418. <![CDATA[constructs an ID object from the given int]]>
  1419. </doc>
  1420. </constructor>
  1421. <constructor name="ID"
  1422. static="false" final="false" visibility="protected"
  1423. deprecated="not deprecated">
  1424. </constructor>
  1425. <doc>
  1426. <![CDATA[A general identifier, which internally stores the id
  1427. as an integer. This is the super class of {@link JobID},
  1428. {@link TaskID} and {@link TaskAttemptID}.
  1429. @see JobID
  1430. @see TaskID
  1431. @see TaskAttemptID]]>
  1432. </doc>
  1433. </class>
  1434. <!-- end class org.apache.hadoop.mapred.ID -->
  1435. <!-- start interface org.apache.hadoop.mapred.InputFormat -->
  1436. <interface name="InputFormat" abstract="true"
  1437. static="false" final="false" visibility="public"
  1438. deprecated="Use {@link org.apache.hadoop.mapreduce.InputFormat} instead.">
  1439. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  1440. abstract="false" native="false" synchronized="false"
  1441. static="false" final="false" visibility="public"
  1442. deprecated="not deprecated">
  1443. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  1444. <param name="numSplits" type="int"/>
  1445. <exception name="IOException" type="java.io.IOException"/>
  1446. <doc>
  1447. <![CDATA[Logically split the set of input files for the job.
  1448. <p>Each {@link InputSplit} is then assigned to an individual {@link Mapper}
  1449. for processing.</p>
  1450. <p><i>Note</i>: The split is a <i>logical</i> split of the inputs and the
  1451. input files are not physically split into chunks. For example, a split could
  1452. be an <i>&lt;input-file-path, start, offset&gt;</i> tuple.</p>
  1453. @param job job configuration.
  1454. @param numSplits the desired number of splits, a hint.
  1455. @return an array of {@link InputSplit}s for the job.]]>
  1456. </doc>
  1457. </method>
  1458. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  1459. abstract="false" native="false" synchronized="false"
  1460. static="false" final="false" visibility="public"
  1461. deprecated="not deprecated">
  1462. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  1463. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  1464. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  1465. <exception name="IOException" type="java.io.IOException"/>
  1466. <doc>
  1467. <![CDATA[Get the {@link RecordReader} for the given {@link InputSplit}.
  1468. <p>It is the responsibility of the <code>RecordReader</code> to respect
  1469. record boundaries while processing the logical split to present a
  1470. record-oriented view to the individual task.</p>
  1471. @param split the {@link InputSplit}
  1472. @param job the job that this split belongs to
  1473. @return a {@link RecordReader}]]>
  1474. </doc>
  1475. </method>
  1476. <doc>
  1477. <![CDATA[<code>InputFormat</code> describes the input-specification for a
  1478. Map-Reduce job.
  1479. <p>The Map-Reduce framework relies on the <code>InputFormat</code> of the
  1480. job to:</p>
  1481. <ol>
  1482. <li>
  1483. Validate the input-specification of the job.</li>
  1484. <li>
  1485. Split-up the input file(s) into logical {@link InputSplit}s, each of
  1486. which is then assigned to an individual {@link Mapper}.
  1487. </li>
  1488. <li>
  1489. Provide the {@link RecordReader} implementation to be used to glean
  1490. input records from the logical <code>InputSplit</code> for processing by
  1491. the {@link Mapper}.
  1492. </li>
  1493. </ol>
  1494. <p>The default behavior of file-based {@link InputFormat}s, typically
  1495. sub-classes of {@link FileInputFormat}, is to split the
  1496. input into <i>logical</i> {@link InputSplit}s based on the total size, in
  1497. bytes, of the input files. However, the {@link FileSystem} blocksize of
  1498. the input files is treated as an upper bound for input splits. A lower bound
  1499. on the split size can be set via
  1500. <a href="{@docRoot}/../mapred-default.html#mapreduce.input.fileinputformat.split.minsize">
  1501. mapreduce.input.fileinputformat.split.minsize</a>.</p>
  1502. <p>Clearly, logical splits based on input-size are insufficient for many
  1503. applications since record boundaries are to be respected. In such cases, the
  1504. application has to also implement a {@link RecordReader} on whom lies the
  1505. responsibility to respect record-boundaries and present a record-oriented
  1506. view of the logical <code>InputSplit</code> to the individual task.</p>
  1507. @see InputSplit
  1508. @see RecordReader
  1509. @see JobClient
  1510. @see FileInputFormat
  1511. @deprecated Use {@link org.apache.hadoop.mapreduce.InputFormat} instead.]]>
  1512. </doc>
  1513. </interface>
  1514. <!-- end interface org.apache.hadoop.mapred.InputFormat -->
  1515. <!-- start interface org.apache.hadoop.mapred.InputSplit -->
  1516. <interface name="InputSplit" abstract="true"
  1517. static="false" final="false" visibility="public"
  1518. deprecated="Use {@link org.apache.hadoop.mapreduce.InputSplit} instead.">
  1519. <implements name="org.apache.hadoop.io.Writable"/>
  1520. <method name="getLength" return="long"
  1521. abstract="false" native="false" synchronized="false"
  1522. static="false" final="false" visibility="public"
  1523. deprecated="not deprecated">
  1524. <exception name="IOException" type="java.io.IOException"/>
  1525. <doc>
  1526. <![CDATA[Get the total number of bytes in the data of the <code>InputSplit</code>.
  1527. @return the number of bytes in the input split.
  1528. @throws IOException]]>
  1529. </doc>
  1530. </method>
  1531. <method name="getLocations" return="java.lang.String[]"
  1532. abstract="false" native="false" synchronized="false"
  1533. static="false" final="false" visibility="public"
  1534. deprecated="not deprecated">
  1535. <exception name="IOException" type="java.io.IOException"/>
  1536. <doc>
  1537. <![CDATA[Get the list of hostnames where the input split is located.
  1538. @return list of hostnames where data of the <code>InputSplit</code> is
  1539. located as an array of <code>String</code>s.
  1540. @throws IOException]]>
  1541. </doc>
  1542. </method>
  1543. <doc>
  1544. <![CDATA[<code>InputSplit</code> represents the data to be processed by an
  1545. individual {@link Mapper}.
  1546. <p>Typically, it presents a byte-oriented view on the input, and it is the
  1547. responsibility of the {@link RecordReader} of the job to process this and present
  1548. a record-oriented view.</p>
  1549. @see InputFormat
  1550. @see RecordReader
  1551. @deprecated Use {@link org.apache.hadoop.mapreduce.InputSplit} instead.]]>
  1552. </doc>
  1553. </interface>
  1554. <!-- end interface org.apache.hadoop.mapred.InputSplit -->
  1555. <!-- start class org.apache.hadoop.mapred.InvalidFileTypeException -->
  1556. <class name="InvalidFileTypeException" extends="java.io.IOException"
  1557. abstract="false"
  1558. static="false" final="false" visibility="public"
  1559. deprecated="not deprecated">
  1560. <constructor name="InvalidFileTypeException"
  1561. static="false" final="false" visibility="public"
  1562. deprecated="not deprecated">
  1563. </constructor>
  1564. <constructor name="InvalidFileTypeException" type="java.lang.String"
  1565. static="false" final="false" visibility="public"
  1566. deprecated="not deprecated">
  1567. </constructor>
  1568. <doc>
  1569. <![CDATA[Used when the file type differs from the desired file type, such as
  1570. getting a file when a directory is expected, or a wrong file type.]]>
  1571. </doc>
  1572. </class>
  1573. <!-- end class org.apache.hadoop.mapred.InvalidFileTypeException -->
  1574. <!-- start class org.apache.hadoop.mapred.InvalidInputException -->
  1575. <class name="InvalidInputException" extends="java.io.IOException"
  1576. abstract="false"
  1577. static="false" final="false" visibility="public"
  1578. deprecated="not deprecated">
  1579. <constructor name="InvalidInputException" type="java.util.List"
  1580. static="false" final="false" visibility="public"
  1581. deprecated="not deprecated">
  1582. <doc>
  1583. <![CDATA[Create the exception with the given list.
  1584. @param probs the list of problems to report. this list is not copied.]]>
  1585. </doc>
  1586. </constructor>
  1587. <method name="getProblems" return="java.util.List"
  1588. abstract="false" native="false" synchronized="false"
  1589. static="false" final="false" visibility="public"
  1590. deprecated="not deprecated">
  1591. <doc>
  1592. <![CDATA[Get the complete list of the problems reported.
  1593. @return the list of problems, which must not be modified]]>
  1594. </doc>
  1595. </method>
  1596. <method name="getMessage" return="java.lang.String"
  1597. abstract="false" native="false" synchronized="false"
  1598. static="false" final="false" visibility="public"
  1599. deprecated="not deprecated">
  1600. <doc>
  1601. <![CDATA[Get a summary message of the problems found.
  1602. @return the concatenated messages from all of the problems.]]>
  1603. </doc>
  1604. </method>
  1605. <doc>
  1606. <![CDATA[This class wraps a list of problems with the input, so that the user
  1607. can get a list of problems together instead of finding and fixing them one
  1608. by one.]]>
  1609. </doc>
  1610. </class>
  1611. <!-- end class org.apache.hadoop.mapred.InvalidInputException -->
  1612. <!-- start class org.apache.hadoop.mapred.InvalidJobConfException -->
  1613. <class name="InvalidJobConfException" extends="java.io.IOException"
  1614. abstract="false"
  1615. static="false" final="false" visibility="public"
  1616. deprecated="not deprecated">
  1617. <constructor name="InvalidJobConfException"
  1618. static="false" final="false" visibility="public"
  1619. deprecated="not deprecated">
  1620. </constructor>
  1621. <constructor name="InvalidJobConfException" type="java.lang.String"
  1622. static="false" final="false" visibility="public"
  1623. deprecated="not deprecated">
  1624. </constructor>
  1625. <doc>
  1626. <![CDATA[This exception is thrown when the jobconf is missing some mandatory attributes
  1627. or the value of some attribute is invalid.]]>
  1628. </doc>
  1629. </class>
  1630. <!-- end class org.apache.hadoop.mapred.InvalidJobConfException -->
  1631. <!-- start class org.apache.hadoop.mapred.IsolationRunner -->
  1632. <class name="IsolationRunner" extends="java.lang.Object"
  1633. abstract="false"
  1634. static="false" final="false" visibility="public"
  1635. deprecated="not deprecated">
  1636. <constructor name="IsolationRunner"
  1637. static="false" final="false" visibility="public"
  1638. deprecated="not deprecated">
  1639. </constructor>
  1640. <method name="main"
  1641. abstract="false" native="false" synchronized="false"
  1642. static="true" final="false" visibility="public"
  1643. deprecated="not deprecated">
  1644. <param name="args" type="java.lang.String[]"/>
  1645. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  1646. <exception name="IOException" type="java.io.IOException"/>
  1647. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  1648. <doc>
  1649. <![CDATA[Run a single task.
  1650. @param args the first argument is the task directory]]>
  1651. </doc>
  1652. </method>
  1653. <doc>
  1654. <![CDATA[IsolationRunner is intended to facilitate debugging by re-running a specific
  1655. task, given left-over task files for a (typically failed) past job.
  1656. Currently, it is limited to re-running map tasks.
  1657. Users may coerce MapReduce to keep task files around by setting
  1658. mapreduce.task.files.preserve.failedtasks. See mapred_tutorial.xml for more documentation.]]>
  1659. </doc>
  1660. </class>
  1661. <!-- end class org.apache.hadoop.mapred.IsolationRunner -->
  1662. <!-- start class org.apache.hadoop.mapred.JobClient -->
  1663. <class name="JobClient" extends="org.apache.hadoop.mapreduce.tools.CLI"
  1664. abstract="false"
  1665. static="false" final="false" visibility="public"
  1666. deprecated="Use {@link Job} and {@link Cluster} instead">
  1667. <constructor name="JobClient"
  1668. static="false" final="false" visibility="public"
  1669. deprecated="not deprecated">
  1670. <doc>
  1671. <![CDATA[Create a job client.]]>
  1672. </doc>
  1673. </constructor>
  1674. <constructor name="JobClient" type="org.apache.hadoop.mapred.JobConf"
  1675. static="false" final="false" visibility="public"
  1676. deprecated="not deprecated">
  1677. <exception name="IOException" type="java.io.IOException"/>
  1678. <doc>
  1679. <![CDATA[Build a job client with the given {@link JobConf}, and connect to the
  1680. default {@link JobTracker}.
  1681. @param conf the job configuration.
  1682. @throws IOException]]>
  1683. </doc>
  1684. </constructor>
  1685. <constructor name="JobClient" type="org.apache.hadoop.conf.Configuration"
  1686. static="false" final="false" visibility="public"
  1687. deprecated="not deprecated">
  1688. <exception name="IOException" type="java.io.IOException"/>
  1689. <doc>
  1690. <![CDATA[Build a job client with the given {@link Configuration},
  1691. and connect to the default {@link JobTracker}.
  1692. @param conf the configuration.
  1693. @throws IOException]]>
  1694. </doc>
  1695. </constructor>
  1696. <constructor name="JobClient" type="java.net.InetSocketAddress, org.apache.hadoop.conf.Configuration"
  1697. static="false" final="false" visibility="public"
  1698. deprecated="not deprecated">
  1699. <exception name="IOException" type="java.io.IOException"/>
  1700. <doc>
  1701. <![CDATA[Build a job client, connect to the indicated job tracker.
  1702. @param jobTrackAddr the job tracker to connect to.
  1703. @param conf configuration.]]>
  1704. </doc>
  1705. </constructor>
  1706. <method name="init"
  1707. abstract="false" native="false" synchronized="false"
  1708. static="false" final="false" visibility="public"
  1709. deprecated="not deprecated">
  1710. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1711. <exception name="IOException" type="java.io.IOException"/>
  1712. <doc>
  1713. <![CDATA[Connect to the default {@link JobTracker}.
  1714. @param conf the job configuration.
  1715. @throws IOException]]>
  1716. </doc>
  1717. </method>
  1718. <method name="close"
  1719. abstract="false" native="false" synchronized="true"
  1720. static="false" final="false" visibility="public"
  1721. deprecated="not deprecated">
  1722. <exception name="IOException" type="java.io.IOException"/>
  1723. <doc>
  1724. <![CDATA[Close the <code>JobClient</code>.]]>
  1725. </doc>
  1726. </method>
  1727. <method name="getFs" return="org.apache.hadoop.fs.FileSystem"
  1728. abstract="false" native="false" synchronized="true"
  1729. static="false" final="false" visibility="public"
  1730. deprecated="not deprecated">
  1731. <exception name="IOException" type="java.io.IOException"/>
  1732. <doc>
  1733. <![CDATA[Get a filesystem handle. We need this to prepare jobs
  1734. for submission to the MapReduce system.
  1735. @return the filesystem handle.]]>
  1736. </doc>
  1737. </method>
  1738. <method name="getClusterHandle" return="org.apache.hadoop.mapreduce.Cluster"
  1739. abstract="false" native="false" synchronized="false"
  1740. static="false" final="false" visibility="public"
  1741. deprecated="not deprecated">
  1742. <doc>
  1743. <![CDATA[Get a handle to the Cluster]]>
  1744. </doc>
  1745. </method>
  1746. <method name="submitJob" return="org.apache.hadoop.mapred.RunningJob"
  1747. abstract="false" native="false" synchronized="false"
  1748. static="false" final="false" visibility="public"
  1749. deprecated="not deprecated">
  1750. <param name="jobFile" type="java.lang.String"/>
  1751. <exception name="FileNotFoundException" type="java.io.FileNotFoundException"/>
  1752. <exception name="InvalidJobConfException" type="org.apache.hadoop.mapred.InvalidJobConfException"/>
  1753. <exception name="IOException" type="java.io.IOException"/>
  1754. <doc>
  1755. <![CDATA[Submit a job to the MR system.
  1756. This returns a handle to the {@link RunningJob} which can be used to track
  1757. the running-job.
  1758. @param jobFile the job configuration.
  1759. @return a handle to the {@link RunningJob} which can be used to track the
  1760. running-job.
  1761. @throws FileNotFoundException
  1762. @throws InvalidJobConfException
  1763. @throws IOException]]>
  1764. </doc>
  1765. </method>
  1766. <method name="submitJob" return="org.apache.hadoop.mapred.RunningJob"
  1767. abstract="false" native="false" synchronized="false"
  1768. static="false" final="false" visibility="public"
  1769. deprecated="not deprecated">
  1770. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1771. <exception name="FileNotFoundException" type="java.io.FileNotFoundException"/>
  1772. <exception name="IOException" type="java.io.IOException"/>
  1773. <doc>
  1774. <![CDATA[Submit a job to the MR system.
  1775. This returns a handle to the {@link RunningJob} which can be used to track
  1776. the running-job.
  1777. @param conf the job configuration.
  1778. @return a handle to the {@link RunningJob} which can be used to track the
  1779. running-job.
  1780. @throws FileNotFoundException
  1781. @throws IOException]]>
  1782. </doc>
  1783. </method>
  1784. <method name="getJob" return="org.apache.hadoop.mapred.RunningJob"
  1785. abstract="false" native="false" synchronized="false"
  1786. static="false" final="false" visibility="public"
  1787. deprecated="not deprecated">
  1788. <param name="jobid" type="org.apache.hadoop.mapred.JobID"/>
  1789. <exception name="IOException" type="java.io.IOException"/>
  1790. <doc>
  1791. <![CDATA[Get a {@link RunningJob} object to track an ongoing job. Returns
  1792. null if the id does not correspond to any known job.
  1793. @param jobid the jobid of the job.
  1794. @return the {@link RunningJob} handle to track the job, null if the
  1795. <code>jobid</code> doesn't correspond to any known job.
  1796. @throws IOException]]>
  1797. </doc>
  1798. </method>
  1799. <method name="getJob" return="org.apache.hadoop.mapred.RunningJob"
  1800. abstract="false" native="false" synchronized="false"
  1801. static="false" final="false" visibility="public"
  1802. deprecated="Applications should rather use {@link #getJob(JobID)}.">
  1803. <param name="jobid" type="java.lang.String"/>
  1804. <exception name="IOException" type="java.io.IOException"/>
  1805. <doc>
  1806. <![CDATA[@deprecated Applications should rather use {@link #getJob(JobID)}.]]>
  1807. </doc>
  1808. </method>
  1809. <method name="getMapTaskReports" return="org.apache.hadoop.mapred.TaskReport[]"
  1810. abstract="false" native="false" synchronized="false"
  1811. static="false" final="false" visibility="public"
  1812. deprecated="not deprecated">
  1813. <param name="jobId" type="org.apache.hadoop.mapred.JobID"/>
  1814. <exception name="IOException" type="java.io.IOException"/>
  1815. <doc>
  1816. <![CDATA[Get the information of the current state of the map tasks of a job.
  1817. @param jobId the job to query.
  1818. @return the list of all of the map tips.
  1819. @throws IOException]]>
  1820. </doc>
  1821. </method>
  1822. <method name="getMapTaskReports" return="org.apache.hadoop.mapred.TaskReport[]"
  1823. abstract="false" native="false" synchronized="false"
  1824. static="false" final="false" visibility="public"
  1825. deprecated="Applications should rather use {@link #getMapTaskReports(JobID)}">
  1826. <param name="jobId" type="java.lang.String"/>
  1827. <exception name="IOException" type="java.io.IOException"/>
  1828. <doc>
  1829. <![CDATA[@deprecated Applications should rather use {@link #getMapTaskReports(JobID)}]]>
  1830. </doc>
  1831. </method>
  1832. <method name="getReduceTaskReports" return="org.apache.hadoop.mapred.TaskReport[]"
  1833. abstract="false" native="false" synchronized="false"
  1834. static="false" final="false" visibility="public"
  1835. deprecated="not deprecated">
  1836. <param name="jobId" type="org.apache.hadoop.mapred.JobID"/>
  1837. <exception name="IOException" type="java.io.IOException"/>
  1838. <doc>
  1839. <![CDATA[Get the information of the current state of the reduce tasks of a job.
  1840. @param jobId the job to query.
  1841. @return the list of all of the reduce tips.
  1842. @throws IOException]]>
  1843. </doc>
  1844. </method>
  1845. <method name="getCleanupTaskReports" return="org.apache.hadoop.mapred.TaskReport[]"
  1846. abstract="false" native="false" synchronized="false"
  1847. static="false" final="false" visibility="public"
  1848. deprecated="not deprecated">
  1849. <param name="jobId" type="org.apache.hadoop.mapred.JobID"/>
  1850. <exception name="IOException" type="java.io.IOException"/>
  1851. <doc>
  1852. <![CDATA[Get the information of the current state of the cleanup tasks of a job.
  1853. @param jobId the job to query.
  1854. @return the list of all of the cleanup tips.
  1855. @throws IOException]]>
  1856. </doc>
  1857. </method>
  1858. <method name="getSetupTaskReports" return="org.apache.hadoop.mapred.TaskReport[]"
  1859. abstract="false" native="false" synchronized="false"
  1860. static="false" final="false" visibility="public"
  1861. deprecated="not deprecated">
  1862. <param name="jobId" type="org.apache.hadoop.mapred.JobID"/>
  1863. <exception name="IOException" type="java.io.IOException"/>
  1864. <doc>
  1865. <![CDATA[Get the information of the current state of the setup tasks of a job.
  1866. @param jobId the job to query.
  1867. @return the list of all of the setup tips.
  1868. @throws IOException]]>
  1869. </doc>
  1870. </method>
  1871. <method name="getReduceTaskReports" return="org.apache.hadoop.mapred.TaskReport[]"
  1872. abstract="false" native="false" synchronized="false"
  1873. static="false" final="false" visibility="public"
  1874. deprecated="Applications should rather use {@link #getReduceTaskReports(JobID)}">
  1875. <param name="jobId" type="java.lang.String"/>
  1876. <exception name="IOException" type="java.io.IOException"/>
  1877. <doc>
  1878. <![CDATA[@deprecated Applications should rather use {@link #getReduceTaskReports(JobID)}]]>
  1879. </doc>
  1880. </method>
  1881. <method name="displayTasks"
  1882. abstract="false" native="false" synchronized="false"
  1883. static="false" final="false" visibility="public"
  1884. deprecated="not deprecated">
  1885. <param name="jobId" type="org.apache.hadoop.mapred.JobID"/>
  1886. <param name="type" type="java.lang.String"/>
  1887. <param name="state" type="java.lang.String"/>
  1888. <exception name="IOException" type="java.io.IOException"/>
  1889. <doc>
  1890. <![CDATA[Display the information about a job's tasks, of a particular type and
  1891. in a particular state
  1892. @param jobId the ID of the job
  1893. @param type the type of the task (map/reduce/setup/cleanup)
  1894. @param state the state of the task
  1895. (pending/running/completed/failed/killed)]]>
  1896. </doc>
  1897. </method>
  1898. <method name="getClusterStatus" return="org.apache.hadoop.mapred.ClusterStatus"
  1899. abstract="false" native="false" synchronized="false"
  1900. static="false" final="false" visibility="public"
  1901. deprecated="not deprecated">
  1902. <exception name="IOException" type="java.io.IOException"/>
  1903. <doc>
  1904. <![CDATA[Get status information about the Map-Reduce cluster.
  1905. @return the status information about the Map-Reduce cluster as an object
  1906. of {@link ClusterStatus}.
  1907. @throws IOException]]>
  1908. </doc>
  1909. </method>
  1910. <method name="getClusterStatus" return="org.apache.hadoop.mapred.ClusterStatus"
  1911. abstract="false" native="false" synchronized="false"
  1912. static="false" final="false" visibility="public"
  1913. deprecated="not deprecated">
  1914. <param name="detailed" type="boolean"/>
  1915. <exception name="IOException" type="java.io.IOException"/>
  1916. <doc>
  1917. <![CDATA[Get status information about the Map-Reduce cluster.
  1918. @param detailed if true then get a detailed status including the
  1919. tracker names
  1920. @return the status information about the Map-Reduce cluster as an object
  1921. of {@link ClusterStatus}.
  1922. @throws IOException]]>
  1923. </doc>
  1924. </method>
  1925. <method name="jobsToComplete" return="org.apache.hadoop.mapred.JobStatus[]"
  1926. abstract="false" native="false" synchronized="false"
  1927. static="false" final="false" visibility="public"
  1928. deprecated="not deprecated">
  1929. <exception name="IOException" type="java.io.IOException"/>
  1930. <doc>
  1931. <![CDATA[Get the jobs that are not completed and not failed.
  1932. @return array of {@link JobStatus} for the running/to-be-run jobs.
  1933. @throws IOException]]>
  1934. </doc>
  1935. </method>
  1936. <method name="getAllJobs" return="org.apache.hadoop.mapred.JobStatus[]"
  1937. abstract="false" native="false" synchronized="false"
  1938. static="false" final="false" visibility="public"
  1939. deprecated="not deprecated">
  1940. <exception name="IOException" type="java.io.IOException"/>
  1941. <doc>
  1942. <![CDATA[Get the jobs that are submitted.
  1943. @return array of {@link JobStatus} for the submitted jobs.
  1944. @throws IOException]]>
  1945. </doc>
  1946. </method>
  1947. <method name="runJob" return="org.apache.hadoop.mapred.RunningJob"
  1948. abstract="false" native="false" synchronized="false"
  1949. static="true" final="false" visibility="public"
  1950. deprecated="not deprecated">
  1951. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  1952. <exception name="IOException" type="java.io.IOException"/>
  1953. <doc>
  1954. <![CDATA[Utility that submits a job, then polls for progress until the job is
  1955. complete.
  1956. @param job the job configuration.
  1957. @throws IOException if the job fails]]>
  1958. </doc>
  1959. </method>
  1960. <method name="monitorAndPrintJob" return="boolean"
  1961. abstract="false" native="false" synchronized="false"
  1962. static="false" final="false" visibility="public"
  1963. deprecated="not deprecated">
  1964. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  1965. <param name="job" type="org.apache.hadoop.mapred.RunningJob"/>
  1966. <exception name="IOException" type="java.io.IOException"/>
  1967. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  1968. <doc>
  1969. <![CDATA[Monitor a job and print status in real-time as progress is made and tasks
  1970. fail.
  1971. @param conf the job's configuration
  1972. @param job the job to track
  1973. @return true if the job succeeded
  1974. @throws IOException if communication to the JobTracker fails]]>
  1975. </doc>
  1976. </method>
  1977. <method name="setTaskOutputFilter"
  1978. abstract="false" native="false" synchronized="false"
  1979. static="false" final="false" visibility="public"
  1980. deprecated="not deprecated">
  1981. <param name="newValue" type="org.apache.hadoop.mapred.JobClient.TaskStatusFilter"/>
  1982. <doc>
  1983. <![CDATA[Sets the output filter for tasks. Only those tasks are printed whose
  1984. output matches the filter.
  1985. @param newValue task filter.]]>
  1986. </doc>
  1987. </method>
  1988. <method name="getTaskOutputFilter" return="org.apache.hadoop.mapred.JobClient.TaskStatusFilter"
  1989. abstract="false" native="false" synchronized="false"
  1990. static="true" final="false" visibility="public"
  1991. deprecated="not deprecated">
  1992. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  1993. <doc>
  1994. <![CDATA[Get the task output filter out of the JobConf.
  1995. @param job the JobConf to examine.
  1996. @return the filter level.]]>
  1997. </doc>
  1998. </method>
  1999. <method name="setTaskOutputFilter"
  2000. abstract="false" native="false" synchronized="false"
  2001. static="true" final="false" visibility="public"
  2002. deprecated="not deprecated">
  2003. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  2004. <param name="newValue" type="org.apache.hadoop.mapred.JobClient.TaskStatusFilter"/>
  2005. <doc>
  2006. <![CDATA[Modify the JobConf to set the task output filter.
  2007. @param job the JobConf to modify.
  2008. @param newValue the value to set.]]>
  2009. </doc>
  2010. </method>
  2011. <method name="getTaskOutputFilter" return="org.apache.hadoop.mapred.JobClient.TaskStatusFilter"
  2012. abstract="false" native="false" synchronized="false"
  2013. static="false" final="false" visibility="public"
  2014. deprecated="not deprecated">
  2015. <doc>
  2016. <![CDATA[Returns task output filter.
  2017. @return task filter.]]>
  2018. </doc>
  2019. </method>
  2020. <method name="getCounter" return="long"
  2021. abstract="false" native="false" synchronized="false"
  2022. static="false" final="false" visibility="protected"
  2023. deprecated="not deprecated">
  2024. <param name="cntrs" type="org.apache.hadoop.mapreduce.Counters"/>
  2025. <param name="counterGroupName" type="java.lang.String"/>
  2026. <param name="counterName" type="java.lang.String"/>
  2027. <exception name="IOException" type="java.io.IOException"/>
  2028. </method>
  2029. <method name="getDefaultMaps" return="int"
  2030. abstract="false" native="false" synchronized="false"
  2031. static="false" final="false" visibility="public"
  2032. deprecated="not deprecated">
  2033. <exception name="IOException" type="java.io.IOException"/>
  2034. <doc>
  2035. <![CDATA[Get status information about the max available Maps in the cluster.
  2036. @return the max available Maps in the cluster
  2037. @throws IOException]]>
  2038. </doc>
  2039. </method>
  2040. <method name="getDefaultReduces" return="int"
  2041. abstract="false" native="false" synchronized="false"
  2042. static="false" final="false" visibility="public"
  2043. deprecated="not deprecated">
  2044. <exception name="IOException" type="java.io.IOException"/>
  2045. <doc>
  2046. <![CDATA[Get status information about the max available Reduces in the cluster.
  2047. @return the max available Reduces in the cluster
  2048. @throws IOException]]>
  2049. </doc>
  2050. </method>
  2051. <method name="getSystemDir" return="org.apache.hadoop.fs.Path"
  2052. abstract="false" native="false" synchronized="false"
  2053. static="false" final="false" visibility="public"
  2054. deprecated="not deprecated">
  2055. <doc>
  2056. <![CDATA[Grab the jobtracker system directory path where job-specific files are to be placed.
  2057. @return the system directory where job-specific files are to be placed.]]>
  2058. </doc>
  2059. </method>
  2060. <method name="getRootQueues" return="org.apache.hadoop.mapred.JobQueueInfo[]"
  2061. abstract="false" native="false" synchronized="false"
  2062. static="false" final="false" visibility="public"
  2063. deprecated="not deprecated">
  2064. <exception name="IOException" type="java.io.IOException"/>
  2065. <doc>
  2066. <![CDATA[Returns an array of queue information objects about root level queues
  2067. configured
  2068. @return the array of root level JobQueueInfo objects
  2069. @throws IOException]]>
  2070. </doc>
  2071. </method>
  2072. <method name="getChildQueues" return="org.apache.hadoop.mapred.JobQueueInfo[]"
  2073. abstract="false" native="false" synchronized="false"
  2074. static="false" final="false" visibility="public"
  2075. deprecated="not deprecated">
  2076. <param name="queueName" type="java.lang.String"/>
  2077. <exception name="IOException" type="java.io.IOException"/>
  2078. <doc>
  2079. <![CDATA[Returns an array of queue information objects about immediate children
  2080. of queue queueName.
  2081. @param queueName
  2082. @return the array of immediate children JobQueueInfo objects
  2083. @throws IOException]]>
  2084. </doc>
  2085. </method>
  2086. <method name="getQueues" return="org.apache.hadoop.mapred.JobQueueInfo[]"
  2087. abstract="false" native="false" synchronized="false"
  2088. static="false" final="false" visibility="public"
  2089. deprecated="not deprecated">
  2090. <exception name="IOException" type="java.io.IOException"/>
  2091. <doc>
  2092. <![CDATA[Return an array of queue information objects about all the Job Queues
  2093. configured.
  2094. @return Array of JobQueueInfo objects
  2095. @throws IOException]]>
  2096. </doc>
  2097. </method>
  2098. <method name="getJobsFromQueue" return="org.apache.hadoop.mapred.JobStatus[]"
  2099. abstract="false" native="false" synchronized="false"
  2100. static="false" final="false" visibility="public"
  2101. deprecated="not deprecated">
  2102. <param name="queueName" type="java.lang.String"/>
  2103. <exception name="IOException" type="java.io.IOException"/>
  2104. <doc>
  2105. <![CDATA[Gets all the jobs which were added to particular Job Queue
  2106. @param queueName name of the Job Queue
  2107. @return Array of jobs present in the job queue
  2108. @throws IOException]]>
  2109. </doc>
  2110. </method>
  2111. <method name="getQueueInfo" return="org.apache.hadoop.mapred.JobQueueInfo"
  2112. abstract="false" native="false" synchronized="false"
  2113. static="false" final="false" visibility="public"
  2114. deprecated="not deprecated">
  2115. <param name="queueName" type="java.lang.String"/>
  2116. <exception name="IOException" type="java.io.IOException"/>
  2117. <doc>
  2118. <![CDATA[Gets the queue information associated to a particular Job Queue
  2119. @param queueName name of the job queue.
  2120. @return Queue information associated to particular queue.
  2121. @throws IOException]]>
  2122. </doc>
  2123. </method>
  2124. <method name="getQueueAclsForCurrentUser" return="org.apache.hadoop.mapred.QueueAclsInfo[]"
  2125. abstract="false" native="false" synchronized="false"
  2126. static="false" final="false" visibility="public"
  2127. deprecated="not deprecated">
  2128. <exception name="IOException" type="java.io.IOException"/>
  2129. <doc>
  2130. <![CDATA[Gets the Queue ACLs for current user
  2131. @return array of QueueAclsInfo object for current user.
  2132. @throws IOException]]>
  2133. </doc>
  2134. </method>
  2135. <method name="getDelegationToken" return="org.apache.hadoop.security.token.Token"
  2136. abstract="false" native="false" synchronized="false"
  2137. static="false" final="false" visibility="public"
  2138. deprecated="not deprecated">
  2139. <param name="renewer" type="org.apache.hadoop.io.Text"/>
  2140. <exception name="IOException" type="java.io.IOException"/>
  2141. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  2142. <doc>
  2143. <![CDATA[Get a delegation token for the user from the JobTracker.
  2144. @param renewer the user who can renew the token
  2145. @return the new token
  2146. @throws IOException]]>
  2147. </doc>
  2148. </method>
  2149. <method name="renewDelegationToken" return="long"
  2150. abstract="false" native="false" synchronized="false"
  2151. static="false" final="false" visibility="public"
  2152. deprecated="not deprecated">
  2153. <param name="token" type="org.apache.hadoop.security.token.Token"/>
  2154. <exception name="SecretManager.InvalidToken" type="org.apache.hadoop.security.token.SecretManager.InvalidToken"/>
  2155. <exception name="IOException" type="java.io.IOException"/>
  2156. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  2157. <doc>
  2158. <![CDATA[Renew a delegation token
  2159. @param token the token to renew
  2160. @return the new expiration time
  2161. @throws InvalidToken
  2162. @throws IOException]]>
  2163. </doc>
  2164. </method>
  2165. <method name="cancelDelegationToken"
  2166. abstract="false" native="false" synchronized="false"
  2167. static="false" final="false" visibility="public"
  2168. deprecated="not deprecated">
  2169. <param name="token" type="org.apache.hadoop.security.token.Token"/>
  2170. <exception name="SecretManager.InvalidToken" type="org.apache.hadoop.security.token.SecretManager.InvalidToken"/>
  2171. <exception name="IOException" type="java.io.IOException"/>
  2172. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  2173. <doc>
  2174. <![CDATA[Cancel a delegation token from the JobTracker
  2175. @param token the token to cancel
  2176. @throws IOException]]>
  2177. </doc>
  2178. </method>
  2179. <method name="main"
  2180. abstract="false" native="false" synchronized="false"
  2181. static="true" final="false" visibility="public"
  2182. deprecated="not deprecated">
  2183. <param name="argv" type="java.lang.String[]"/>
  2184. <exception name="Exception" type="java.lang.Exception"/>
  2185. </method>
  2186. <doc>
  2187. <![CDATA[<code>JobClient</code> is the primary interface for the user-job to interact
  2188. with the {@link JobTracker}.
  2189. <code>JobClient</code> provides facilities to submit jobs, track their
  2190. progress, access component-tasks' reports/logs, get the Map-Reduce cluster
  2191. status information etc.
  2192. <p>The job submission process involves:
  2193. <ol>
  2194. <li>
  2195. Checking the input and output specifications of the job.
  2196. </li>
  2197. <li>
  2198. Computing the {@link InputSplit}s for the job.
  2199. </li>
  2200. <li>
  2201. Setting up the requisite accounting information for the {@link DistributedCache}
  2202. of the job, if necessary.
  2203. </li>
  2204. <li>
  2205. Copying the job's jar and configuration to the map-reduce system directory
  2206. on the distributed file-system.
  2207. </li>
  2208. <li>
  2209. Submitting the job to the <code>JobTracker</code> and optionally monitoring
  2210. its status.
  2211. </li>
  2212. </ol></p>
  2213. Normally the user creates the application, describes various facets of the
  2214. job via {@link JobConf} and then uses the <code>JobClient</code> to submit
  2215. the job and monitor its progress.
  2216. <p>Here is an example on how to use <code>JobClient</code>:</p>
  2217. <p><blockquote><pre>
  2218. // Create a new JobConf
  2219. JobConf job = new JobConf(new Configuration(), MyJob.class);
  2220. // Specify various job-specific parameters
  2221. job.setJobName("myjob");
  2222. job.setInputPath(new Path("in"));
  2223. job.setOutputPath(new Path("out"));
  2224. job.setMapperClass(MyJob.MyMapper.class);
  2225. job.setReducerClass(MyJob.MyReducer.class);
  2226. // Submit the job, then poll for progress until the job is complete
  2227. JobClient.runJob(job);
  2228. </pre></blockquote></p>
  2229. <h4 id="JobControl">Job Control</h4>
  2230. <p>At times clients would chain map-reduce jobs to accomplish complex tasks
  2231. which cannot be done via a single map-reduce job. This is fairly easy since
  2232. the output of the job, typically, goes to distributed file-system and that
  2233. can be used as the input for the next job.</p>
  2234. <p>However, this also means that the onus on ensuring jobs are complete
  2235. (success/failure) lies squarely on the clients. In such situations the
  2236. various job-control options are:
  2237. <ol>
  2238. <li>
  2239. {@link #runJob(JobConf)} : submits the job and returns only after
  2240. the job has completed.
  2241. </li>
  2242. <li>
  2243. {@link #submitJob(JobConf)} : only submits the job, then poll the
  2244. returned handle to the {@link RunningJob} to query status and make
  2245. scheduling decisions.
  2246. </li>
  2247. <li>
  2248. {@link JobConf#setJobEndNotificationURI(String)} : sets up a notification
  2249. on job-completion, thus avoiding polling.
  2250. </li>
  2251. </ol></p>
  2252. @see JobConf
  2253. @see ClusterStatus
  2254. @see Tool
  2255. @see DistributedCache
  2256. @deprecated Use {@link Job} and {@link Cluster} instead]]>
  2257. </doc>
  2258. </class>
  2259. <!-- end class org.apache.hadoop.mapred.JobClient -->
  2260. <!-- start class org.apache.hadoop.mapred.JobClient.TaskStatusFilter -->
  2261. <class name="JobClient.TaskStatusFilter" extends="java.lang.Enum"
  2262. abstract="false"
  2263. static="true" final="true" visibility="public"
  2264. deprecated="not deprecated">
  2265. <method name="values" return="org.apache.hadoop.mapred.JobClient.TaskStatusFilter[]"
  2266. abstract="false" native="false" synchronized="false"
  2267. static="true" final="false" visibility="public"
  2268. deprecated="not deprecated">
  2269. </method>
  2270. <method name="valueOf" return="org.apache.hadoop.mapred.JobClient.TaskStatusFilter"
  2271. abstract="false" native="false" synchronized="false"
  2272. static="true" final="false" visibility="public"
  2273. deprecated="not deprecated">
  2274. <param name="name" type="java.lang.String"/>
  2275. </method>
  2276. </class>
  2277. <!-- end class org.apache.hadoop.mapred.JobClient.TaskStatusFilter -->
  2278. <!-- start class org.apache.hadoop.mapred.JobConf -->
  2279. <class name="JobConf" extends="org.apache.hadoop.conf.Configuration"
  2280. abstract="false"
  2281. static="false" final="false" visibility="public"
  2282. deprecated="Use {@link Configuration} instead">
  2283. <constructor name="JobConf"
  2284. static="false" final="false" visibility="public"
  2285. deprecated="not deprecated">
  2286. <doc>
  2287. <![CDATA[Construct a map/reduce job configuration.]]>
  2288. </doc>
  2289. </constructor>
  2290. <constructor name="JobConf" type="java.lang.Class"
  2291. static="false" final="false" visibility="public"
  2292. deprecated="not deprecated">
  2293. <doc>
  2294. <![CDATA[Construct a map/reduce job configuration.
  2295. @param exampleClass a class whose containing jar is used as the job's jar.]]>
  2296. </doc>
  2297. </constructor>
  2298. <constructor name="JobConf" type="org.apache.hadoop.conf.Configuration"
  2299. static="false" final="false" visibility="public"
  2300. deprecated="not deprecated">
  2301. <doc>
  2302. <![CDATA[Construct a map/reduce job configuration.
  2303. @param conf a Configuration whose settings will be inherited.]]>
  2304. </doc>
  2305. </constructor>
  2306. <constructor name="JobConf" type="org.apache.hadoop.conf.Configuration, java.lang.Class"
  2307. static="false" final="false" visibility="public"
  2308. deprecated="not deprecated">
  2309. <doc>
  2310. <![CDATA[Construct a map/reduce job configuration.
  2311. @param conf a Configuration whose settings will be inherited.
  2312. @param exampleClass a class whose containing jar is used as the job's jar.]]>
  2313. </doc>
  2314. </constructor>
  2315. <constructor name="JobConf" type="java.lang.String"
  2316. static="false" final="false" visibility="public"
  2317. deprecated="not deprecated">
  2318. <doc>
  2319. <![CDATA[Construct a map/reduce configuration.
  2320. @param config a Configuration-format XML job description file.]]>
  2321. </doc>
  2322. </constructor>
  2323. <constructor name="JobConf" type="org.apache.hadoop.fs.Path"
  2324. static="false" final="false" visibility="public"
  2325. deprecated="not deprecated">
  2326. <doc>
  2327. <![CDATA[Construct a map/reduce configuration.
  2328. @param config a Configuration-format XML job description file.]]>
  2329. </doc>
  2330. </constructor>
  2331. <constructor name="JobConf" type="boolean"
  2332. static="false" final="false" visibility="public"
  2333. deprecated="not deprecated">
  2334. <doc>
  2335. <![CDATA[A new map/reduce configuration where the behavior of reading from the
  2336. default resources can be turned off.
  2337. <p/>
  2338. If the parameter {@code loadDefaults} is false, the new instance
  2339. will not load resources from the default files.
  2340. @param loadDefaults specifies whether to load from the default files]]>
  2341. </doc>
  2342. </constructor>
  2343. <method name="getCredentials" return="org.apache.hadoop.security.Credentials"
  2344. abstract="false" native="false" synchronized="false"
  2345. static="false" final="false" visibility="public"
  2346. deprecated="not deprecated">
  2347. <doc>
  2348. <![CDATA[Get credentials for the job.
  2349. @return credentials for the job]]>
  2350. </doc>
  2351. </method>
  2352. <method name="getJar" return="java.lang.String"
  2353. abstract="false" native="false" synchronized="false"
  2354. static="false" final="false" visibility="public"
  2355. deprecated="not deprecated">
  2356. <doc>
  2357. <![CDATA[Get the user jar for the map-reduce job.
  2358. @return the user jar for the map-reduce job.]]>
  2359. </doc>
  2360. </method>
  2361. <method name="setJar"
  2362. abstract="false" native="false" synchronized="false"
  2363. static="false" final="false" visibility="public"
  2364. deprecated="not deprecated">
  2365. <param name="jar" type="java.lang.String"/>
  2366. <doc>
  2367. <![CDATA[Set the user jar for the map-reduce job.
  2368. @param jar the user jar for the map-reduce job.]]>
  2369. </doc>
  2370. </method>
  2371. <method name="getJarUnpackPattern" return="java.util.regex.Pattern"
  2372. abstract="false" native="false" synchronized="false"
  2373. static="false" final="false" visibility="public"
  2374. deprecated="not deprecated">
  2375. <doc>
  2376. <![CDATA[Get the pattern for jar contents to unpack on the tasktracker]]>
  2377. </doc>
  2378. </method>
  2379. <method name="setJarByClass"
  2380. abstract="false" native="false" synchronized="false"
  2381. static="false" final="false" visibility="public"
  2382. deprecated="not deprecated">
  2383. <param name="cls" type="java.lang.Class"/>
  2384. <doc>
  2385. <![CDATA[Set the job's jar file by finding an example class location.
  2386. @param cls the example class.]]>
  2387. </doc>
  2388. </method>
  2389. <method name="getLocalDirs" return="java.lang.String[]"
  2390. abstract="false" native="false" synchronized="false"
  2391. static="false" final="false" visibility="public"
  2392. deprecated="not deprecated">
  2393. <exception name="IOException" type="java.io.IOException"/>
  2394. </method>
  2395. <method name="deleteLocalFiles"
  2396. abstract="false" native="false" synchronized="false"
  2397. static="false" final="false" visibility="public"
  2398. deprecated="not deprecated">
  2399. <exception name="IOException" type="java.io.IOException"/>
  2400. <doc>
  2401. <![CDATA[Use MRAsyncDiskService.moveAndDeleteAllVolumes instead.
  2402. @see org.apache.hadoop.mapreduce.util.MRAsyncDiskService#cleanupAllVolumes()]]>
  2403. </doc>
  2404. </method>
  2405. <method name="deleteLocalFiles"
  2406. abstract="false" native="false" synchronized="false"
  2407. static="false" final="false" visibility="public"
  2408. deprecated="not deprecated">
  2409. <param name="subdir" type="java.lang.String"/>
  2410. <exception name="IOException" type="java.io.IOException"/>
  2411. </method>
  2412. <method name="getLocalPath" return="org.apache.hadoop.fs.Path"
  2413. abstract="false" native="false" synchronized="false"
  2414. static="false" final="false" visibility="public"
  2415. deprecated="not deprecated">
  2416. <param name="pathString" type="java.lang.String"/>
  2417. <exception name="IOException" type="java.io.IOException"/>
  2418. <doc>
  2419. <![CDATA[Constructs a local file name. Files are distributed among configured
  2420. local directories.]]>
  2421. </doc>
  2422. </method>
  2423. <method name="getUser" return="java.lang.String"
  2424. abstract="false" native="false" synchronized="false"
  2425. static="false" final="false" visibility="public"
  2426. deprecated="not deprecated">
  2427. <doc>
  2428. <![CDATA[Get the reported username for this job.
  2429. @return the username]]>
  2430. </doc>
  2431. </method>
  2432. <method name="setUser"
  2433. abstract="false" native="false" synchronized="false"
  2434. static="false" final="false" visibility="public"
  2435. deprecated="not deprecated">
  2436. <param name="user" type="java.lang.String"/>
  2437. <doc>
  2438. <![CDATA[Set the reported username for this job.
  2439. @param user the username for this job.]]>
  2440. </doc>
  2441. </method>
  2442. <method name="setKeepFailedTaskFiles"
  2443. abstract="false" native="false" synchronized="false"
  2444. static="false" final="false" visibility="public"
  2445. deprecated="not deprecated">
  2446. <param name="keep" type="boolean"/>
  2447. <doc>
  2448. <![CDATA[Set whether the framework should keep the intermediate files for
  2449. failed tasks.
  2450. @param keep <code>true</code> if framework should keep the intermediate files
  2451. for failed tasks, <code>false</code> otherwise.]]>
  2452. </doc>
  2453. </method>
  2454. <method name="getKeepFailedTaskFiles" return="boolean"
  2455. abstract="false" native="false" synchronized="false"
  2456. static="false" final="false" visibility="public"
  2457. deprecated="not deprecated">
  2458. <doc>
  2459. <![CDATA[Should the temporary files for failed tasks be kept?
  2460. @return should the files be kept?]]>
  2461. </doc>
  2462. </method>
  2463. <method name="setKeepTaskFilesPattern"
  2464. abstract="false" native="false" synchronized="false"
  2465. static="false" final="false" visibility="public"
  2466. deprecated="not deprecated">
  2467. <param name="pattern" type="java.lang.String"/>
  2468. <doc>
  2469. <![CDATA[Set a regular expression for task names that should be kept.
  2470. The regular expression ".*_m_000123_0" would keep the files
  2471. for the first instance of map 123 that ran.
  2472. @param pattern the java.util.regex.Pattern to match against the
  2473. task names.]]>
  2474. </doc>
  2475. </method>
  2476. <method name="getKeepTaskFilesPattern" return="java.lang.String"
  2477. abstract="false" native="false" synchronized="false"
  2478. static="false" final="false" visibility="public"
  2479. deprecated="not deprecated">
  2480. <doc>
  2481. <![CDATA[Get the regular expression that is matched against the task names
  2482. to see if we need to keep the files.
  2483. @return the pattern as a string, if it was set, otherwise null.
  2484. </doc>
  2485. </method>
  2486. <method name="setWorkingDirectory"
  2487. abstract="false" native="false" synchronized="false"
  2488. static="false" final="false" visibility="public"
  2489. deprecated="not deprecated">
  2490. <param name="dir" type="org.apache.hadoop.fs.Path"/>
  2491. <doc>
  2492. <![CDATA[Set the current working directory for the default file system.
  2493. @param dir the new current working directory.]]>
  2494. </doc>
  2495. </method>
  2496. <method name="getWorkingDirectory" return="org.apache.hadoop.fs.Path"
  2497. abstract="false" native="false" synchronized="false"
  2498. static="false" final="false" visibility="public"
  2499. deprecated="not deprecated">
  2500. <doc>
  2501. <![CDATA[Get the current working directory for the default file system.
  2502. @return the directory name.]]>
  2503. </doc>
  2504. </method>
  2505. <method name="setNumTasksToExecutePerJvm"
  2506. abstract="false" native="false" synchronized="false"
  2507. static="false" final="false" visibility="public"
  2508. deprecated="not deprecated">
  2509. <param name="numTasks" type="int"/>
  2510. <doc>
  2511. <![CDATA[Sets the number of tasks that a spawned task JVM should run
  2512. before it exits
  2513. @param numTasks the number of tasks to execute; defaults to 1;
  2514. -1 signifies no limit]]>
  2515. </doc>
  2516. </method>
  2517. <method name="getNumTasksToExecutePerJvm" return="int"
  2518. abstract="false" native="false" synchronized="false"
  2519. static="false" final="false" visibility="public"
  2520. deprecated="not deprecated">
  2521. <doc>
  2522. <![CDATA[Get the number of tasks that a spawned JVM should execute]]>
  2523. </doc>
  2524. </method>
  2525. <method name="getInputFormat" return="org.apache.hadoop.mapred.InputFormat"
  2526. abstract="false" native="false" synchronized="false"
  2527. static="false" final="false" visibility="public"
  2528. deprecated="not deprecated">
  2529. <doc>
  2530. <![CDATA[Get the {@link InputFormat} implementation for the map-reduce job,
  2531. defaults to {@link TextInputFormat} if not specified explicitly.
  2532. @return the {@link InputFormat} implementation for the map-reduce job.]]>
  2533. </doc>
  2534. </method>
  2535. <method name="setInputFormat"
  2536. abstract="false" native="false" synchronized="false"
  2537. static="false" final="false" visibility="public"
  2538. deprecated="not deprecated">
  2539. <param name="theClass" type="java.lang.Class"/>
  2540. <doc>
  2541. <![CDATA[Set the {@link InputFormat} implementation for the map-reduce job.
  2542. @param theClass the {@link InputFormat} implementation for the map-reduce
  2543. job.]]>
  2544. </doc>
  2545. </method>
  2546. <method name="getOutputFormat" return="org.apache.hadoop.mapred.OutputFormat"
  2547. abstract="false" native="false" synchronized="false"
  2548. static="false" final="false" visibility="public"
  2549. deprecated="not deprecated">
  2550. <doc>
  2551. <![CDATA[Get the {@link OutputFormat} implementation for the map-reduce job,
  2552. defaults to {@link TextOutputFormat} if not specified explicitly.
  2553. @return the {@link OutputFormat} implementation for the map-reduce job.]]>
  2554. </doc>
  2555. </method>
  2556. <method name="getOutputCommitter" return="org.apache.hadoop.mapred.OutputCommitter"
  2557. abstract="false" native="false" synchronized="false"
  2558. static="false" final="false" visibility="public"
  2559. deprecated="not deprecated">
  2560. <doc>
  2561. <![CDATA[Get the {@link OutputCommitter} implementation for the map-reduce job,
  2562. defaults to {@link FileOutputCommitter} if not specified explicitly.
  2563. @return the {@link OutputCommitter} implementation for the map-reduce job.]]>
  2564. </doc>
  2565. </method>
  2566. <method name="setOutputCommitter"
  2567. abstract="false" native="false" synchronized="false"
  2568. static="false" final="false" visibility="public"
  2569. deprecated="not deprecated">
  2570. <param name="theClass" type="java.lang.Class"/>
  2571. <doc>
  2572. <![CDATA[Set the {@link OutputCommitter} implementation for the map-reduce job.
  2573. @param theClass the {@link OutputCommitter} implementation for the map-reduce
  2574. job.]]>
  2575. </doc>
  2576. </method>
  2577. <method name="setOutputFormat"
  2578. abstract="false" native="false" synchronized="false"
  2579. static="false" final="false" visibility="public"
  2580. deprecated="not deprecated">
  2581. <param name="theClass" type="java.lang.Class"/>
  2582. <doc>
  2583. <![CDATA[Set the {@link OutputFormat} implementation for the map-reduce job.
  2584. @param theClass the {@link OutputFormat} implementation for the map-reduce
  2585. job.]]>
  2586. </doc>
  2587. </method>
  2588. <method name="setCompressMapOutput"
  2589. abstract="false" native="false" synchronized="false"
  2590. static="false" final="false" visibility="public"
  2591. deprecated="not deprecated">
  2592. <param name="compress" type="boolean"/>
  2593. <doc>
  2594. <![CDATA[Should the map outputs be compressed before transfer?
  2595. Uses the SequenceFile compression.
  2596. @param compress should the map outputs be compressed?]]>
  2597. </doc>
  2598. </method>
  2599. <method name="getCompressMapOutput" return="boolean"
  2600. abstract="false" native="false" synchronized="false"
  2601. static="false" final="false" visibility="public"
  2602. deprecated="not deprecated">
  2603. <doc>
  2604. <![CDATA[Are the outputs of the maps to be compressed?
  2605. @return <code>true</code> if the outputs of the maps are to be compressed,
  2606. <code>false</code> otherwise.]]>
  2607. </doc>
  2608. </method>
  2609. <method name="setMapOutputCompressorClass"
  2610. abstract="false" native="false" synchronized="false"
  2611. static="false" final="false" visibility="public"
  2612. deprecated="not deprecated">
  2613. <param name="codecClass" type="java.lang.Class"/>
  2614. <doc>
  2615. <![CDATA[Set the given class as the {@link CompressionCodec} for the map outputs.
  2616. @param codecClass the {@link CompressionCodec} class that will compress
  2617. the map outputs.]]>
  2618. </doc>
  2619. </method>
  2620. <method name="getMapOutputCompressorClass" return="java.lang.Class"
  2621. abstract="false" native="false" synchronized="false"
  2622. static="false" final="false" visibility="public"
  2623. deprecated="not deprecated">
  2624. <param name="defaultValue" type="java.lang.Class"/>
  2625. <doc>
  2626. <![CDATA[Get the {@link CompressionCodec} for compressing the map outputs.
  2627. @param defaultValue the {@link CompressionCodec} to return if not set
  2628. @return the {@link CompressionCodec} class that should be used to compress the
  2629. map outputs.
  2630. @throws IllegalArgumentException if the class was specified, but not found]]>
  2631. </doc>
  2632. </method>
  2633. <method name="getMapOutputKeyClass" return="java.lang.Class"
  2634. abstract="false" native="false" synchronized="false"
  2635. static="false" final="false" visibility="public"
  2636. deprecated="not deprecated">
  2637. <doc>
  2638. <![CDATA[Get the key class for the map output data. If it is not set, use the
  2639. (final) output key class. This allows the map output key class to be
  2640. different than the final output key class.
  2641. @return the map output key class.]]>
  2642. </doc>
  2643. </method>
  2644. <method name="setMapOutputKeyClass"
  2645. abstract="false" native="false" synchronized="false"
  2646. static="false" final="false" visibility="public"
  2647. deprecated="not deprecated">
  2648. <param name="theClass" type="java.lang.Class"/>
  2649. <doc>
  2650. <![CDATA[Set the key class for the map output data. This allows the user to
  2651. specify the map output key class to be different than the final output
  2652. key class.
  2653. @param theClass the map output key class.]]>
  2654. </doc>
  2655. </method>
  2656. <method name="getMapOutputValueClass" return="java.lang.Class"
  2657. abstract="false" native="false" synchronized="false"
  2658. static="false" final="false" visibility="public"
  2659. deprecated="not deprecated">
  2660. <doc>
  2661. <![CDATA[Get the value class for the map output data. If it is not set, use the
  2662. (final) output value class. This allows the map output value class to be
  2663. different than the final output value class.
  2664. @return the map output value class.]]>
  2665. </doc>
  2666. </method>
  2667. <method name="setMapOutputValueClass"
  2668. abstract="false" native="false" synchronized="false"
  2669. static="false" final="false" visibility="public"
  2670. deprecated="not deprecated">
  2671. <param name="theClass" type="java.lang.Class"/>
  2672. <doc>
  2673. <![CDATA[Set the value class for the map output data. This allows the user to
  2674. specify the map output value class to be different than the final output
  2675. value class.
  2676. @param theClass the map output value class.]]>
  2677. </doc>
  2678. </method>
  2679. <method name="getOutputKeyClass" return="java.lang.Class"
  2680. abstract="false" native="false" synchronized="false"
  2681. static="false" final="false" visibility="public"
  2682. deprecated="not deprecated">
  2683. <doc>
  2684. <![CDATA[Get the key class for the job output data.
  2685. @return the key class for the job output data.]]>
  2686. </doc>
  2687. </method>
  2688. <method name="setOutputKeyClass"
  2689. abstract="false" native="false" synchronized="false"
  2690. static="false" final="false" visibility="public"
  2691. deprecated="not deprecated">
  2692. <param name="theClass" type="java.lang.Class"/>
  2693. <doc>
  2694. <![CDATA[Set the key class for the job output data.
  2695. @param theClass the key class for the job output data.]]>
  2696. </doc>
  2697. </method>
  2698. <method name="getOutputKeyComparator" return="org.apache.hadoop.io.RawComparator"
  2699. abstract="false" native="false" synchronized="false"
  2700. static="false" final="false" visibility="public"
  2701. deprecated="not deprecated">
  2702. <doc>
  2703. <![CDATA[Get the {@link RawComparator} comparator used to compare keys.
  2704. @return the {@link RawComparator} comparator used to compare keys.]]>
  2705. </doc>
  2706. </method>
  2707. <method name="setOutputKeyComparatorClass"
  2708. abstract="false" native="false" synchronized="false"
  2709. static="false" final="false" visibility="public"
  2710. deprecated="not deprecated">
  2711. <param name="theClass" type="java.lang.Class"/>
  2712. <doc>
  2713. <![CDATA[Set the {@link RawComparator} comparator used to compare keys.
  2714. @param theClass the {@link RawComparator} comparator used to
  2715. compare keys.
  2716. @see #setOutputValueGroupingComparator(Class)]]>
  2717. </doc>
  2718. </method>
  2719. <method name="setKeyFieldComparatorOptions"
  2720. abstract="false" native="false" synchronized="false"
  2721. static="false" final="false" visibility="public"
  2722. deprecated="not deprecated">
  2723. <param name="keySpec" type="java.lang.String"/>
  2724. <doc>
  2725. <![CDATA[Set the {@link KeyFieldBasedComparator} options used to compare keys.
  2726. @param keySpec the key specification of the form -k pos1[,pos2], where,
  2727. pos is of the form f[.c][opts], where f is the number
  2728. of the key field to use, and c is the number of the first character from
  2729. the beginning of the field. Fields and character positions are numbered
  2730. starting with 1; a character position of zero in pos2 indicates the
  2731. field's last character. If '.c' is omitted from pos1, it defaults to 1
  2732. (the beginning of the field); if omitted from pos2, it defaults to 0
  2733. (the end of the field). opts are ordering options. The supported options
  2734. are:
  2735. -n, (Sort numerically)
  2736. -r, (Reverse the result of comparison)]]>
  2737. </doc>
  2738. </method>
  2739. <method name="getKeyFieldComparatorOption" return="java.lang.String"
  2740. abstract="false" native="false" synchronized="false"
  2741. static="false" final="false" visibility="public"
  2742. deprecated="not deprecated">
  2743. <doc>
  2744. <![CDATA[Get the {@link KeyFieldBasedComparator} options]]>
  2745. </doc>
  2746. </method>
  2747. <method name="setKeyFieldPartitionerOptions"
  2748. abstract="false" native="false" synchronized="false"
  2749. static="false" final="false" visibility="public"
  2750. deprecated="not deprecated">
  2751. <param name="keySpec" type="java.lang.String"/>
  2752. <doc>
  2753. <![CDATA[Set the {@link KeyFieldBasedPartitioner} options used for
  2754. {@link Partitioner}.
  2755. @param keySpec the key specification of the form -k pos1[,pos2], where,
  2756. pos is of the form f[.c][opts], where f is the number
  2757. of the key field to use, and c is the number of the first character from
  2758. the beginning of the field. Fields and character positions are numbered
  2759. starting with 1; a character position of zero in pos2 indicates the
  2760. field's last character. If '.c' is omitted from pos1, it defaults to 1
  2761. (the beginning of the field); if omitted from pos2, it defaults to 0
  2762. (the end of the field).]]>
  2763. </doc>
  2764. </method>
  2765. <method name="getKeyFieldPartitionerOption" return="java.lang.String"
  2766. abstract="false" native="false" synchronized="false"
  2767. static="false" final="false" visibility="public"
  2768. deprecated="not deprecated">
  2769. <doc>
  2770. <![CDATA[Get the {@link KeyFieldBasedPartitioner} options]]>
  2771. </doc>
  2772. </method>
  2773. <method name="getOutputValueGroupingComparator" return="org.apache.hadoop.io.RawComparator"
  2774. abstract="false" native="false" synchronized="false"
  2775. static="false" final="false" visibility="public"
  2776. deprecated="not deprecated">
  2777. <doc>
  2778. <![CDATA[Get the user defined {@link RawComparator} comparator for
  2779. grouping keys of inputs to the reduce.
  2780. @return comparator set by the user for grouping values.
  2781. @see #setOutputValueGroupingComparator(Class) for details.]]>
  2782. </doc>
  2783. </method>
  2784. <method name="setOutputValueGroupingComparator"
  2785. abstract="false" native="false" synchronized="false"
  2786. static="false" final="false" visibility="public"
  2787. deprecated="not deprecated">
  2788. <param name="theClass" type="java.lang.Class"/>
  2789. <doc>
  2790. <![CDATA[Set the user defined {@link RawComparator} comparator for
  2791. grouping keys in the input to the reduce.
  2792. <p>This comparator should be provided if the equivalence rules for keys
  2793. for sorting the intermediates are different from those for grouping keys
  2794. before each call to
  2795. {@link Reducer#reduce(Object, java.util.Iterator, OutputCollector, Reporter)}.</p>
  2796. <p>For key-value pairs (K1,V1) and (K2,V2), the values (V1, V2) are passed
  2797. in a single call to the reduce function if K1 and K2 compare as equal.</p>
  2798. <p>Since {@link #setOutputKeyComparatorClass(Class)} can be used to control
  2799. how keys are sorted, this can be used in conjunction to simulate
  2800. <i>secondary sort on values</i>.</p>
  2801. <p><i>Note</i>: This is not a guarantee of the reduce sort being
  2802. <i>stable</i> in any sense. (In any case, with the order of available
  2803. map-outputs to the reduce being non-deterministic, it wouldn't make
  2804. that much sense.)</p>
  2805. @param theClass the comparator class to be used for grouping keys.
  2806. It should implement <code>RawComparator</code>.
  2807. @see #setOutputKeyComparatorClass(Class)]]>
  2808. </doc>
  2809. </method>
  2810. <method name="getUseNewMapper" return="boolean"
  2811. abstract="false" native="false" synchronized="false"
  2812. static="false" final="false" visibility="public"
  2813. deprecated="not deprecated">
  2814. <doc>
  2815. <![CDATA[Should the framework use the new context-object code for running
  2816. the mapper?
  2817. @return true, if the new api should be used]]>
  2818. </doc>
  2819. </method>
  2820. <method name="setUseNewMapper"
  2821. abstract="false" native="false" synchronized="false"
  2822. static="false" final="false" visibility="public"
  2823. deprecated="not deprecated">
  2824. <param name="flag" type="boolean"/>
  2825. <doc>
  2826. <![CDATA[Set whether the framework should use the new api for the mapper.
  2827. This is the default for jobs submitted with the new Job api.
  2828. @param flag true, if the new api should be used]]>
  2829. </doc>
  2830. </method>
  2831. <method name="getUseNewReducer" return="boolean"
  2832. abstract="false" native="false" synchronized="false"
  2833. static="false" final="false" visibility="public"
  2834. deprecated="not deprecated">
  2835. <doc>
  2836. <![CDATA[Should the framework use the new context-object code for running
  2837. the reducer?
  2838. @return true, if the new api should be used]]>
  2839. </doc>
  2840. </method>
  2841. <method name="setUseNewReducer"
  2842. abstract="false" native="false" synchronized="false"
  2843. static="false" final="false" visibility="public"
  2844. deprecated="not deprecated">
  2845. <param name="flag" type="boolean"/>
  2846. <doc>
  2847. <![CDATA[Set whether the framework should use the new api for the reducer.
  2848. This is the default for jobs submitted with the new Job api.
  2849. @param flag true, if the new api should be used]]>
  2850. </doc>
  2851. </method>
  2852. <method name="getOutputValueClass" return="java.lang.Class"
  2853. abstract="false" native="false" synchronized="false"
  2854. static="false" final="false" visibility="public"
  2855. deprecated="not deprecated">
  2856. <doc>
  2857. <![CDATA[Get the value class for job outputs.
  2858. @return the value class for job outputs.]]>
  2859. </doc>
  2860. </method>
  2861. <method name="setOutputValueClass"
  2862. abstract="false" native="false" synchronized="false"
  2863. static="false" final="false" visibility="public"
  2864. deprecated="not deprecated">
  2865. <param name="theClass" type="java.lang.Class"/>
  2866. <doc>
  2867. <![CDATA[Set the value class for job outputs.
  2868. @param theClass the value class for job outputs.]]>
  2869. </doc>
  2870. </method>
  2871. <method name="getMapperClass" return="java.lang.Class"
  2872. abstract="false" native="false" synchronized="false"
  2873. static="false" final="false" visibility="public"
  2874. deprecated="not deprecated">
  2875. <doc>
  2876. <![CDATA[Get the {@link Mapper} class for the job.
  2877. @return the {@link Mapper} class for the job.]]>
  2878. </doc>
  2879. </method>
  2880. <method name="setMapperClass"
  2881. abstract="false" native="false" synchronized="false"
  2882. static="false" final="false" visibility="public"
  2883. deprecated="not deprecated">
  2884. <param name="theClass" type="java.lang.Class"/>
  2885. <doc>
  2886. <![CDATA[Set the {@link Mapper} class for the job.
  2887. @param theClass the {@link Mapper} class for the job.]]>
  2888. </doc>
  2889. </method>
  2890. <method name="getMapRunnerClass" return="java.lang.Class"
  2891. abstract="false" native="false" synchronized="false"
  2892. static="false" final="false" visibility="public"
  2893. deprecated="not deprecated">
  2894. <doc>
  2895. <![CDATA[Get the {@link MapRunnable} class for the job.
  2896. @return the {@link MapRunnable} class for the job.]]>
  2897. </doc>
  2898. </method>
  2899. <method name="setMapRunnerClass"
  2900. abstract="false" native="false" synchronized="false"
  2901. static="false" final="false" visibility="public"
  2902. deprecated="not deprecated">
  2903. <param name="theClass" type="java.lang.Class"/>
  2904. <doc>
  2905. <![CDATA[Expert: Set the {@link MapRunnable} class for the job.
  2906. Typically used to exert greater control on {@link Mapper}s.
  2907. @param theClass the {@link MapRunnable} class for the job.]]>
  2908. </doc>
  2909. </method>
  2910. <method name="getPartitionerClass" return="java.lang.Class"
  2911. abstract="false" native="false" synchronized="false"
  2912. static="false" final="false" visibility="public"
  2913. deprecated="not deprecated">
  2914. <doc>
  2915. <![CDATA[Get the {@link Partitioner} used to partition {@link Mapper}-outputs
  2916. to be sent to the {@link Reducer}s.
  2917. @return the {@link Partitioner} used to partition map-outputs.]]>
  2918. </doc>
  2919. </method>
  2920. <method name="setPartitionerClass"
  2921. abstract="false" native="false" synchronized="false"
  2922. static="false" final="false" visibility="public"
  2923. deprecated="not deprecated">
  2924. <param name="theClass" type="java.lang.Class"/>
  2925. <doc>
  2926. <![CDATA[Set the {@link Partitioner} class used to partition
  2927. {@link Mapper}-outputs to be sent to the {@link Reducer}s.
  2928. @param theClass the {@link Partitioner} used to partition map-outputs.]]>
  2929. </doc>
  2930. </method>
  2931. <method name="getReducerClass" return="java.lang.Class"
  2932. abstract="false" native="false" synchronized="false"
  2933. static="false" final="false" visibility="public"
  2934. deprecated="not deprecated">
  2935. <doc>
  2936. <![CDATA[Get the {@link Reducer} class for the job.
  2937. @return the {@link Reducer} class for the job.]]>
  2938. </doc>
  2939. </method>
  2940. <method name="setReducerClass"
  2941. abstract="false" native="false" synchronized="false"
  2942. static="false" final="false" visibility="public"
  2943. deprecated="not deprecated">
  2944. <param name="theClass" type="java.lang.Class"/>
  2945. <doc>
  2946. <![CDATA[Set the {@link Reducer} class for the job.
  2947. @param theClass the {@link Reducer} class for the job.]]>
  2948. </doc>
  2949. </method>
  2950. <method name="getCombinerClass" return="java.lang.Class"
  2951. abstract="false" native="false" synchronized="false"
  2952. static="false" final="false" visibility="public"
  2953. deprecated="not deprecated">
  2954. <doc>
  2955. <![CDATA[Get the user-defined <i>combiner</i> class used to combine map-outputs
  2956. before being sent to the reducers. Typically the combiner is the same as
  2957. the {@link Reducer} for the job i.e. {@link #getReducerClass()}.
  2958. @return the user-defined combiner class used to combine map-outputs.]]>
  2959. </doc>
  2960. </method>
  2961. <method name="setCombinerClass"
  2962. abstract="false" native="false" synchronized="false"
  2963. static="false" final="false" visibility="public"
  2964. deprecated="not deprecated">
  2965. <param name="theClass" type="java.lang.Class"/>
  2966. <doc>
  2967. <![CDATA[Set the user-defined <i>combiner</i> class used to combine map-outputs
  2968. before being sent to the reducers.
  2969. <p>The combiner is an application-specified aggregation operation, which
  2970. can help cut down the amount of data transferred between the
  2971. {@link Mapper} and the {@link Reducer}, leading to better performance.</p>
  2972. <p>The framework may invoke the combiner 0, 1, or multiple times, in both
  2973. the mapper and reducer tasks. In general, the combiner is called as the
  2974. sort/merge result is written to disk. The combiner must:
  2975. <ul>
  2976. <li> be side-effect free</li>
  2977. <li> have the same input and output key types and the same input and
  2978. output value types</li>
  2979. </ul></p>
  2980. <p>Typically the combiner is the same as the <code>Reducer</code> for the
  2981. job i.e. {@link #setReducerClass(Class)}.</p>
  2982. @param theClass the user-defined combiner class used to combine
  2983. map-outputs.]]>
  2984. </doc>
  2985. </method>
  2986. <method name="getSpeculativeExecution" return="boolean"
  2987. abstract="false" native="false" synchronized="false"
  2988. static="false" final="false" visibility="public"
  2989. deprecated="not deprecated">
  2990. <doc>
  2991. <![CDATA[Should speculative execution be used for this job?
  2992. Defaults to <code>true</code>.
  2993. @return <code>true</code> if speculative execution should be used for this job,
  2994. <code>false</code> otherwise.]]>
  2995. </doc>
  2996. </method>
  2997. <method name="setSpeculativeExecution"
  2998. abstract="false" native="false" synchronized="false"
  2999. static="false" final="false" visibility="public"
  3000. deprecated="not deprecated">
  3001. <param name="speculativeExecution" type="boolean"/>
  3002. <doc>
  3003. <![CDATA[Turn speculative execution on or off for this job.
  3004. @param speculativeExecution <code>true</code> if speculative execution
  3005. should be turned on, else <code>false</code>.]]>
  3006. </doc>
  3007. </method>
  3008. <method name="getMapSpeculativeExecution" return="boolean"
  3009. abstract="false" native="false" synchronized="false"
  3010. static="false" final="false" visibility="public"
  3011. deprecated="not deprecated">
  3012. <doc>
  3013. <![CDATA[Should speculative execution be used for this job for map tasks?
  3014. Defaults to <code>true</code>.
  3015. @return <code>true</code> if speculative execution should be
  3016. used for this job for map tasks,
  3017. <code>false</code> otherwise.]]>
  3018. </doc>
  3019. </method>
  3020. <method name="setMapSpeculativeExecution"
  3021. abstract="false" native="false" synchronized="false"
  3022. static="false" final="false" visibility="public"
  3023. deprecated="not deprecated">
  3024. <param name="speculativeExecution" type="boolean"/>
  3025. <doc>
  3026. <![CDATA[Turn speculative execution on or off for this job for map tasks.
  3027. @param speculativeExecution <code>true</code> if speculative execution
  3028. should be turned on for map tasks,
  3029. else <code>false</code>.]]>
  3030. </doc>
  3031. </method>
  3032. <method name="getReduceSpeculativeExecution" return="boolean"
  3033. abstract="false" native="false" synchronized="false"
  3034. static="false" final="false" visibility="public"
  3035. deprecated="not deprecated">
  3036. <doc>
  3037. <![CDATA[Should speculative execution be used for this job for reduce tasks?
  3038. Defaults to <code>true</code>.
  3039. @return <code>true</code> if speculative execution should be used
  3040. for reduce tasks for this job,
  3041. <code>false</code> otherwise.]]>
  3042. </doc>
  3043. </method>
  3044. <method name="setReduceSpeculativeExecution"
  3045. abstract="false" native="false" synchronized="false"
  3046. static="false" final="false" visibility="public"
  3047. deprecated="not deprecated">
  3048. <param name="speculativeExecution" type="boolean"/>
  3049. <doc>
  3050. <![CDATA[Turn speculative execution on or off for this job for reduce tasks.
  3051. @param speculativeExecution <code>true</code> if speculative execution
  3052. should be turned on for reduce tasks,
  3053. else <code>false</code>.]]>
  3054. </doc>
  3055. </method>
  3056. <method name="getNumMapTasks" return="int"
  3057. abstract="false" native="false" synchronized="false"
  3058. static="false" final="false" visibility="public"
  3059. deprecated="not deprecated">
  3060. <doc>
  3061. <![CDATA[Get the configured number of map tasks for this job.
  3062. Defaults to <code>1</code>.
  3063. @return the number of map tasks for this job.]]>
  3064. </doc>
  3065. </method>
  3066. <method name="setNumMapTasks"
  3067. abstract="false" native="false" synchronized="false"
  3068. static="false" final="false" visibility="public"
  3069. deprecated="not deprecated">
  3070. <param name="n" type="int"/>
  3071. <doc>
  3072. <![CDATA[Set the number of map tasks for this job.
  3073. <p><i>Note</i>: This is only a <i>hint</i> to the framework. The actual
  3074. number of spawned map tasks depends on the number of {@link InputSplit}s
  3075. generated by the job's {@link InputFormat#getSplits(JobConf, int)}.
  3076. A custom {@link InputFormat} is typically used to accurately control
  3077. the number of map tasks for the job.</p>
  3078. <h4 id="NoOfMaps">How many maps?</h4>
  3079. <p>The number of maps is usually driven by the total size of the inputs
  3080. i.e. total number of blocks of the input files.</p>
  3081. <p>The right level of parallelism for maps seems to be around 10-100 maps
  3082. per-node, although it has been set up to 300 or so for very cpu-light map
  3083. tasks. Task setup takes a while, so it is best if the maps take at least a
  3084. minute to execute.</p>
  3085. <p>The default behavior of file-based {@link InputFormat}s is to split the
  3086. input into <i>logical</i> {@link InputSplit}s based on the total size, in
  3087. bytes, of input files. However, the {@link FileSystem} blocksize of the
  3088. input files is treated as an upper bound for input splits. A lower bound
  3089. on the split size can be set via
  3090. <a href="{@docRoot}/../mapred-default.html#mapreduce.input.fileinputformat.split.minsize">
  3091. mapreduce.input.fileinputformat.split.minsize</a>.</p>
  3092. <p>Thus, if you expect 10TB of input data and have a blocksize of 128MB,
  3093. you'll end up with 82,000 maps, unless {@link #setNumMapTasks(int)} is
  3094. used to set it even higher.</p>
  3095. @param n the number of map tasks for this job.
  3096. @see InputFormat#getSplits(JobConf, int)
  3097. @see FileInputFormat
  3098. @see FileSystem#getDefaultBlockSize()
  3099. @see FileStatus#getBlockSize()]]>
  3100. </doc>
  3101. </method>
  3102. <method name="getNumReduceTasks" return="int"
  3103. abstract="false" native="false" synchronized="false"
  3104. static="false" final="false" visibility="public"
  3105. deprecated="not deprecated">
  3106. <doc>
  3107. <![CDATA[Get the configured number of reduce tasks for this job. Defaults to
  3108. <code>1</code>.
  3109. @return the number of reduce tasks for this job.]]>
  3110. </doc>
  3111. </method>
  3112. <method name="setNumReduceTasks"
  3113. abstract="false" native="false" synchronized="false"
  3114. static="false" final="false" visibility="public"
  3115. deprecated="not deprecated">
  3116. <param name="n" type="int"/>
  3117. <doc>
  3118. <![CDATA[Set the requisite number of reduce tasks for this job.
  3119. <h4 id="NoOfReduces">How many reduces?</h4>
  3120. <p>The right number of reduces seems to be <code>0.95</code> or
  3121. <code>1.75</code> multiplied by (&lt;<i>no. of nodes</i>&gt; *
  3122. <a href="{@docRoot}/../mapred-default.html#mapreduce.tasktracker.reduce.tasks.maximum">
  3123. mapreduce.tasktracker.reduce.tasks.maximum</a>).
  3124. </p>
  3125. <p>With <code>0.95</code> all of the reduces can launch immediately and
  3126. start transferring map outputs as the maps finish. With <code>1.75</code>
  3127. the faster nodes will finish their first round of reduces and launch a
  3128. second wave of reduces doing a much better job of load balancing.</p>
  3129. <p>Increasing the number of reduces increases the framework overhead, but
  3130. increases load balancing and lowers the cost of failures.</p>
  3131. <p>The scaling factors above are slightly less than whole numbers to
  3132. reserve a few reduce slots in the framework for speculative-tasks, failures
  3133. etc.</p>
  3134. <h4 id="ReducerNone">Reducer NONE</h4>
  3135. <p>It is legal to set the number of reduce-tasks to <code>zero</code>.</p>
  3136. <p>In this case the output of the map-tasks goes directly to the distributed
  3137. file-system, to the path set by
  3138. {@link FileOutputFormat#setOutputPath(JobConf, Path)}. Also, the
  3139. framework doesn't sort the map-outputs before writing them out to HDFS.</p>
  3140. @param n the number of reduce tasks for this job.]]>
  3141. </doc>
  3142. </method>
  3143. <method name="getMaxMapAttempts" return="int"
  3144. abstract="false" native="false" synchronized="false"
  3145. static="false" final="false" visibility="public"
  3146. deprecated="not deprecated">
  3147. <doc>
  3148. <![CDATA[Get the configured number of maximum attempts that will be made to run a
  3149. map task, as specified by the <code>mapreduce.map.maxattempts</code>
  3150. property. If this property is not already set, the default is 4 attempts.
  3151. @return the max number of attempts per map task.]]>
  3152. </doc>
  3153. </method>
  3154. <method name="setMaxMapAttempts"
  3155. abstract="false" native="false" synchronized="false"
  3156. static="false" final="false" visibility="public"
  3157. deprecated="not deprecated">
  3158. <param name="n" type="int"/>
  3159. <doc>
  3160. <![CDATA[Expert: Set the number of maximum attempts that will be made to run a
  3161. map task.
  3162. @param n the number of attempts per map task.]]>
  3163. </doc>
  3164. </method>
  3165. <method name="getMaxReduceAttempts" return="int"
  3166. abstract="false" native="false" synchronized="false"
  3167. static="false" final="false" visibility="public"
  3168. deprecated="not deprecated">
  3169. <doc>
  3170. <![CDATA[Get the configured number of maximum attempts that will be made to run a
  3171. reduce task, as specified by the <code>mapreduce.reduce.maxattempts</code>
  3172. property. If this property is not already set, the default is 4 attempts.
  3173. @return the max number of attempts per reduce task.]]>
  3174. </doc>
  3175. </method>
  3176. <method name="setMaxReduceAttempts"
  3177. abstract="false" native="false" synchronized="false"
  3178. static="false" final="false" visibility="public"
  3179. deprecated="not deprecated">
  3180. <param name="n" type="int"/>
  3181. <doc>
  3182. <![CDATA[Expert: Set the number of maximum attempts that will be made to run a
  3183. reduce task.
  3184. @param n the number of attempts per reduce task.]]>
  3185. </doc>
  3186. </method>
  3187. <method name="getJobName" return="java.lang.String"
  3188. abstract="false" native="false" synchronized="false"
  3189. static="false" final="false" visibility="public"
  3190. deprecated="not deprecated">
  3191. <doc>
  3192. <![CDATA[Get the user-specified job name. This is only used to identify the
  3193. job to the user.
  3194. @return the job's name, defaulting to "".]]>
  3195. </doc>
  3196. </method>
  3197. <method name="setJobName"
  3198. abstract="false" native="false" synchronized="false"
  3199. static="false" final="false" visibility="public"
  3200. deprecated="not deprecated">
  3201. <param name="name" type="java.lang.String"/>
  3202. <doc>
  3203. <![CDATA[Set the user-specified job name.
  3204. @param name the job's new name.]]>
  3205. </doc>
  3206. </method>
  3207. <method name="getSessionId" return="java.lang.String"
  3208. abstract="false" native="false" synchronized="false"
  3209. static="false" final="false" visibility="public"
  3210. deprecated="not deprecated">
  3211. <doc>
  3212. <![CDATA[Get the user-specified session identifier. The default is the empty string.
  3213. The session identifier is used to tag metric data that is reported to some
  3214. performance metrics system via the org.apache.hadoop.metrics API. The
  3215. session identifier is intended, in particular, for use by Hadoop-On-Demand
  3216. (HOD) which allocates a virtual Hadoop cluster dynamically and transiently.
  3217. HOD will set the session identifier by modifying the mapred-site.xml file
  3218. before starting the cluster.
  3219. When not running under HOD, this identifier is expected to remain set to
  3220. the empty string.
  3221. @return the session identifier, defaulting to "".]]>
  3222. </doc>
  3223. </method>
  3224. <method name="setSessionId"
  3225. abstract="false" native="false" synchronized="false"
  3226. static="false" final="false" visibility="public"
  3227. deprecated="not deprecated">
  3228. <param name="sessionId" type="java.lang.String"/>
  3229. <doc>
  3230. <![CDATA[Set the user-specified session identifier.
  3231. @param sessionId the new session id.]]>
  3232. </doc>
  3233. </method>
  3234. <method name="setMaxTaskFailuresPerTracker"
  3235. abstract="false" native="false" synchronized="false"
  3236. static="false" final="false" visibility="public"
  3237. deprecated="not deprecated">
  3238. <param name="noFailures" type="int"/>
  3239. <doc>
  3240. <![CDATA[Set the maximum no. of failures of a given job per tasktracker.
  3241. If the no. of task failures exceeds <code>noFailures</code>, the
  3242. tasktracker is <i>blacklisted</i> for this job.
  3243. @param noFailures maximum no. of failures of a given job per tasktracker.]]>
  3244. </doc>
  3245. </method>
  3246. <method name="getMaxTaskFailuresPerTracker" return="int"
  3247. abstract="false" native="false" synchronized="false"
  3248. static="false" final="false" visibility="public"
  3249. deprecated="not deprecated">
  3250. <doc>
  3251. <![CDATA[Expert: Get the maximum no. of failures of a given job per tasktracker.
  3252. If the no. of task failures exceeds this, the tasktracker is
  3253. <i>blacklisted</i> for this job.
  3254. @return the maximum no. of failures of a given job per tasktracker.]]>
  3255. </doc>
  3256. </method>
  3257. <method name="getMaxMapTaskFailuresPercent" return="int"
  3258. abstract="false" native="false" synchronized="false"
  3259. static="false" final="false" visibility="public"
  3260. deprecated="not deprecated">
  3261. <doc>
  3262. <![CDATA[Get the maximum percentage of map tasks that can fail without
  3263. the job being aborted.
  3264. Each map task is executed a minimum of {@link #getMaxMapAttempts()}
  3265. attempts before being declared as <i>failed</i>.
  3266. Defaults to <code>zero</code>, i.e. <i>any</i> failed map-task results in
  3267. the job being declared as {@link JobStatus#FAILED}.
  3268. @return the maximum percentage of map tasks that can fail without
  3269. the job being aborted.]]>
  3270. </doc>
  3271. </method>
  3272. <method name="setMaxMapTaskFailuresPercent"
  3273. abstract="false" native="false" synchronized="false"
  3274. static="false" final="false" visibility="public"
  3275. deprecated="not deprecated">
  3276. <param name="percent" type="int"/>
  3277. <doc>
  3278. <![CDATA[Expert: Set the maximum percentage of map tasks that can fail without the
  3279. job being aborted.
  3280. Each map task is executed a minimum of {@link #getMaxMapAttempts} attempts
  3281. before being declared as <i>failed</i>.
  3282. @param percent the maximum percentage of map tasks that can fail without
  3283. the job being aborted.]]>
  3284. </doc>
  3285. </method>
  3286. <method name="getMaxReduceTaskFailuresPercent" return="int"
  3287. abstract="false" native="false" synchronized="false"
  3288. static="false" final="false" visibility="public"
  3289. deprecated="not deprecated">
  3290. <doc>
  3291. <![CDATA[Get the maximum percentage of reduce tasks that can fail without
  3292. the job being aborted.
  3293. Each reduce task is executed a minimum of {@link #getMaxReduceAttempts()}
  3294. attempts before being declared as <i>failed</i>.
  3295. Defaults to <code>zero</code>, i.e. <i>any</i> failed reduce-task results
  3296. in the job being declared as {@link JobStatus#FAILED}.
  3297. @return the maximum percentage of reduce tasks that can fail without
  3298. the job being aborted.]]>
  3299. </doc>
  3300. </method>
  3301. <method name="setMaxReduceTaskFailuresPercent"
  3302. abstract="false" native="false" synchronized="false"
  3303. static="false" final="false" visibility="public"
  3304. deprecated="not deprecated">
  3305. <param name="percent" type="int"/>
  3306. <doc>
  3307. <![CDATA[Set the maximum percentage of reduce tasks that can fail without the job
  3308. being aborted.
  3309. Each reduce task is executed a minimum of {@link #getMaxReduceAttempts()}
  3310. attempts before being declared as <i>failed</i>.
  3311. @param percent the maximum percentage of reduce tasks that can fail without
  3312. the job being aborted.]]>
  3313. </doc>
  3314. </method>
  3315. <method name="setJobPriority"
  3316. abstract="false" native="false" synchronized="false"
  3317. static="false" final="false" visibility="public"
  3318. deprecated="not deprecated">
  3319. <param name="prio" type="org.apache.hadoop.mapred.JobPriority"/>
  3320. <doc>
  3321. <![CDATA[Set {@link JobPriority} for this job.
  3322. @param prio the {@link JobPriority} for this job.]]>
  3323. </doc>
  3324. </method>
  3325. <method name="getJobPriority" return="org.apache.hadoop.mapred.JobPriority"
  3326. abstract="false" native="false" synchronized="false"
  3327. static="false" final="false" visibility="public"
  3328. deprecated="not deprecated">
  3329. <doc>
  3330. <![CDATA[Get the {@link JobPriority} for this job.
  3331. @return the {@link JobPriority} for this job.]]>
  3332. </doc>
  3333. </method>
  3334. <method name="getProfileEnabled" return="boolean"
  3335. abstract="false" native="false" synchronized="false"
  3336. static="false" final="false" visibility="public"
  3337. deprecated="not deprecated">
  3338. <doc>
  3339. <![CDATA[Get whether the task profiling is enabled.
  3340. @return true if some tasks will be profiled]]>
  3341. </doc>
  3342. </method>
  3343. <method name="setProfileEnabled"
  3344. abstract="false" native="false" synchronized="false"
  3345. static="false" final="false" visibility="public"
  3346. deprecated="not deprecated">
  3347. <param name="newValue" type="boolean"/>
  3348. <doc>
  3349. <![CDATA[Set whether the system should collect profiler information for some of
  3350. the tasks in this job. The information is stored in the user log
  3351. directory.
  3352. @param newValue true means it should be gathered]]>
  3353. </doc>
  3354. </method>
  3355. <method name="getProfileParams" return="java.lang.String"
  3356. abstract="false" native="false" synchronized="false"
  3357. static="false" final="false" visibility="public"
  3358. deprecated="not deprecated">
  3359. <doc>
  3360. <![CDATA[Get the profiler configuration arguments.
  3361. The default value for this property is
  3362. "-agentlib:hprof=cpu=samples,heap=sites,force=n,thread=y,verbose=n,file=%s"
  3363. @return the parameters to pass to the task child to configure profiling]]>
  3364. </doc>
  3365. </method>
  3366. <method name="setProfileParams"
  3367. abstract="false" native="false" synchronized="false"
  3368. static="false" final="false" visibility="public"
  3369. deprecated="not deprecated">
  3370. <param name="value" type="java.lang.String"/>
  3371. <doc>
  3372. <![CDATA[Set the profiler configuration arguments. If the string contains a '%s' it
  3373. will be replaced with the name of the profiling output file when the task
  3374. runs.
  3375. This value is passed to the task child JVM on the command line.
  3376. @param value the configuration string]]>
  3377. </doc>
  3378. </method>
  3379. <method name="getProfileTaskRange" return="org.apache.hadoop.conf.Configuration.IntegerRanges"
  3380. abstract="false" native="false" synchronized="false"
  3381. static="false" final="false" visibility="public"
  3382. deprecated="not deprecated">
  3383. <param name="isMap" type="boolean"/>
  3384. <doc>
  3385. <![CDATA[Get the range of maps or reduces to profile.
  3386. @param isMap is the task a map?
  3387. @return the task ranges]]>
  3388. </doc>
  3389. </method>
  3390. <method name="setProfileTaskRange"
  3391. abstract="false" native="false" synchronized="false"
  3392. static="false" final="false" visibility="public"
  3393. deprecated="not deprecated">
  3394. <param name="isMap" type="boolean"/>
  3395. <param name="newValue" type="java.lang.String"/>
  3396. <doc>
  3397. <![CDATA[Set the ranges of maps or reduces to profile. setProfileEnabled(true)
  3398. must also be called.
  3399. @param newValue a set of integer ranges of the map ids]]>
  3400. </doc>
  3401. </method>
  3402. <method name="setMapDebugScript"
  3403. abstract="false" native="false" synchronized="false"
  3404. static="false" final="false" visibility="public"
  3405. deprecated="not deprecated">
  3406. <param name="mDbgScript" type="java.lang.String"/>
  3407. <doc>
  3408. <![CDATA[Set the debug script to run when the map tasks fail.
  3409. <p>The debug script can aid debugging of failed map tasks. The script is
  3410. given task's stdout, stderr, syslog, jobconf files as arguments.</p>
  3411. <p>The debug command, run on the node where the map failed, is:</p>
  3412. <p><pre><blockquote>
  3413. $script $stdout $stderr $syslog $jobconf.
  3414. </blockquote></pre></p>
  3415. <p> The script file is distributed through {@link DistributedCache}
  3416. APIs. The script needs to be symlinked. </p>
  3417. <p>Here is an example on how to submit a script:</p>
  3418. <p><blockquote><pre>
  3419. job.setMapDebugScript("./myscript");
  3420. DistributedCache.createSymlink(job);
  3421. DistributedCache.addCacheFile("/debug/scripts/myscript#myscript");
  3422. </pre></blockquote></p>
  3423. @param mDbgScript the script name]]>
  3424. </doc>
  3425. </method>
  3426. <method name="getMapDebugScript" return="java.lang.String"
  3427. abstract="false" native="false" synchronized="false"
  3428. static="false" final="false" visibility="public"
  3429. deprecated="not deprecated">
  3430. <doc>
  3431. <![CDATA[Get the map task's debug script.
  3432. @return the debug Script for the mapred job for failed map tasks.
  3433. @see #setMapDebugScript(String)]]>
  3434. </doc>
  3435. </method>
  3436. <method name="setReduceDebugScript"
  3437. abstract="false" native="false" synchronized="false"
  3438. static="false" final="false" visibility="public"
  3439. deprecated="not deprecated">
  3440. <param name="rDbgScript" type="java.lang.String"/>
  3441. <doc>
  3442. <![CDATA[Set the debug script to run when the reduce tasks fail.
  3443. <p>The debug script can aid debugging of failed reduce tasks. The script
  3444. is given task's stdout, stderr, syslog, jobconf files as arguments.</p>
  3445. <p>The debug command, run on the node where the reduce failed, is:</p>
  3446. <p><pre><blockquote>
  3447. $script $stdout $stderr $syslog $jobconf.
  3448. </blockquote></pre></p>
  3449. <p> The script file is distributed through {@link DistributedCache}
  3450. APIs. The script file needs to be symlinked </p>
  3451. <p>Here is an example on how to submit a script:</p>
  3452. <p><blockquote><pre>
  3453. job.setReduceDebugScript("./myscript");
  3454. DistributedCache.createSymlink(job);
  3455. DistributedCache.addCacheFile("/debug/scripts/myscript#myscript");
  3456. </pre></blockquote></p>
  3457. @param rDbgScript the script name]]>
  3458. </doc>
  3459. </method>
  3460. <method name="getReduceDebugScript" return="java.lang.String"
  3461. abstract="false" native="false" synchronized="false"
  3462. static="false" final="false" visibility="public"
  3463. deprecated="not deprecated">
  3464. <doc>
  3465. <![CDATA[Get the reduce task's debug script.
  3466. @return the debug script for the mapred job for failed reduce tasks.
  3467. @see #setReduceDebugScript(String)]]>
  3468. </doc>
  3469. </method>
  3470. <method name="getJobEndNotificationURI" return="java.lang.String"
  3471. abstract="false" native="false" synchronized="false"
  3472. static="false" final="false" visibility="public"
  3473. deprecated="not deprecated">
  3474. <doc>
  3475. <![CDATA[Get the uri to be invoked in order to send a notification after the job
  3476. has completed (success/failure).
  3477. @return the job end notification uri, <code>null</code> if it hasn't
  3478. been set.
  3479. @see #setJobEndNotificationURI(String)]]>
  3480. </doc>
  3481. </method>
  3482. <method name="setJobEndNotificationURI"
  3483. abstract="false" native="false" synchronized="false"
  3484. static="false" final="false" visibility="public"
  3485. deprecated="not deprecated">
  3486. <param name="uri" type="java.lang.String"/>
  3487. <doc>
  3488. <![CDATA[Set the uri to be invoked in order to send a notification after the job
  3489. has completed (success/failure).
  3490. <p>The uri can contain 2 special parameters: <tt>$jobId</tt> and
  3491. <tt>$jobStatus</tt>. Those, if present, are replaced by the job's
  3492. identifier and completion-status respectively.</p>
  3493. <p>This is typically used by application-writers to implement chaining of
  3494. Map-Reduce jobs in an <i>asynchronous manner</i>.</p>
  3495. @param uri the job end notification uri
  3496. @see JobStatus
  3497. @see <a
  3498. href="{@docRoot}/org/apache/hadoop/mapred/JobClient.html#JobCompletionAndChaining">Job Completion and Chaining</a>]]>
  3499. </doc>
  3500. </method>
  3501. <method name="getJobLocalDir" return="java.lang.String"
  3502. abstract="false" native="false" synchronized="false"
  3503. static="false" final="false" visibility="public"
  3504. deprecated="not deprecated">
  3505. <doc>
  3506. <![CDATA[Get job-specific shared directory for use as scratch space
  3507. <p>
  3508. When a job starts, a shared directory is created at location
  3509. <code>
  3510. ${mapreduce.cluster.local.dir}/taskTracker/$user/jobcache/$jobid/work/ </code>.
  3511. This directory is exposed to the users through
  3512. <code>mapreduce.job.local.dir </code>.
  3513. So, the tasks can use this space
  3514. as scratch space and share files among them. </p>
  3515. This value is also available as a System property.
  3516. @return The localized job specific shared directory]]>
  3517. </doc>
  3518. </method>
  3519. <method name="getMemoryForMapTask" return="long"
  3520. abstract="false" native="false" synchronized="false"
  3521. static="false" final="false" visibility="public"
  3522. deprecated="not deprecated">
  3523. <doc>
  3524. <![CDATA[Get memory required to run a map task of the job, in MB.
  3525. If a value is specified in the configuration, it is returned.
  3526. Else, it returns {@link #DISABLED_MEMORY_LIMIT}.
  3527. <p/>
  3528. For backward compatibility, if the job configuration sets the
  3529. key {@link #MAPRED_TASK_MAXVMEM_PROPERTY} to a value different
  3530. from {@link #DISABLED_MEMORY_LIMIT}, that value will be used
  3531. after converting it from bytes to MB.
  3532. @return memory required to run a map task of the job, in MB,
  3533. or {@link #DISABLED_MEMORY_LIMIT} if unset.]]>
  3534. </doc>
  3535. </method>
  3536. <method name="setMemoryForMapTask"
  3537. abstract="false" native="false" synchronized="false"
  3538. static="false" final="false" visibility="public"
  3539. deprecated="not deprecated">
  3540. <param name="mem" type="long"/>
  3541. </method>
  3542. <method name="getMemoryForReduceTask" return="long"
  3543. abstract="false" native="false" synchronized="false"
  3544. static="false" final="false" visibility="public"
  3545. deprecated="not deprecated">
  3546. <doc>
  3547. <![CDATA[Get memory required to run a reduce task of the job, in MB.
  3548. If a value is specified in the configuration, it is returned.
  3549. Else, it returns {@link #DISABLED_MEMORY_LIMIT}.
  3550. <p/>
  3551. For backward compatibility, if the job configuration sets the
  3552. key {@link #MAPRED_TASK_MAXVMEM_PROPERTY} to a value different
  3553. from {@link #DISABLED_MEMORY_LIMIT}, that value will be used
  3554. after converting it from bytes to MB.
  3555. @return memory required to run a reduce task of the job, in MB,
  3556. or {@link #DISABLED_MEMORY_LIMIT} if unset.]]>
  3557. </doc>
  3558. </method>
  3559. <method name="setMemoryForReduceTask"
  3560. abstract="false" native="false" synchronized="false"
  3561. static="false" final="false" visibility="public"
  3562. deprecated="not deprecated">
  3563. <param name="mem" type="long"/>
  3564. </method>
  3565. <method name="getQueueName" return="java.lang.String"
  3566. abstract="false" native="false" synchronized="false"
  3567. static="false" final="false" visibility="public"
  3568. deprecated="not deprecated">
  3569. <doc>
  3570. <![CDATA[Return the name of the queue to which this job is submitted.
  3571. Defaults to 'default'.
  3572. @return name of the queue]]>
  3573. </doc>
  3574. </method>
  3575. <method name="setQueueName"
  3576. abstract="false" native="false" synchronized="false"
  3577. static="false" final="false" visibility="public"
  3578. deprecated="not deprecated">
  3579. <param name="queueName" type="java.lang.String"/>
  3580. <doc>
  3581. <![CDATA[Set the name of the queue to which this job should be submitted.
  3582. @param queueName Name of the queue]]>
  3583. </doc>
  3584. </method>
  3585. <method name="normalizeMemoryConfigValue" return="long"
  3586. abstract="false" native="false" synchronized="false"
  3587. static="true" final="false" visibility="public"
  3588. deprecated="not deprecated">
  3589. <param name="val" type="long"/>
  3590. <doc>
  3591. <![CDATA[Normalize the negative values in configuration
  3592. @param val
  3593. @return normalized value]]>
  3594. </doc>
  3595. </method>
  3596. <method name="getMaxVirtualMemoryForTask" return="long"
  3597. abstract="false" native="false" synchronized="false"
  3598. static="false" final="false" visibility="public"
  3599. deprecated="Use {@link #getMemoryForMapTask()} and
  3600. {@link #getMemoryForReduceTask()}">
  3601. <doc>
  3602. <![CDATA[Get the memory required to run a task of this job, in bytes. See
  3603. {@link #MAPRED_TASK_MAXVMEM_PROPERTY}
  3604. <p/>
  3605. This method is deprecated. Now, different memory limits can be
  3606. set for map and reduce tasks of a job, in MB.
  3607. <p/>
  3608. For backward compatibility, if the job configuration sets the
  3609. key {@link #MAPRED_TASK_MAXVMEM_PROPERTY} to a value different
  3610. from {@link #DISABLED_MEMORY_LIMIT}, that value is returned.
  3611. Otherwise, this method will return the larger of the values returned by
  3612. {@link #getMemoryForMapTask()} and {@link #getMemoryForReduceTask()}
  3613. after converting them into bytes.
  3614. @return Memory required to run a task of this job, in bytes,
  3615. or {@link #DISABLED_MEMORY_LIMIT}, if unset.
  3616. @see #setMaxVirtualMemoryForTask(long)
  3617. @deprecated Use {@link #getMemoryForMapTask()} and
  3618. {@link #getMemoryForReduceTask()}]]>
  3619. </doc>
  3620. </method>
  3621. <method name="setMaxVirtualMemoryForTask"
  3622. abstract="false" native="false" synchronized="false"
  3623. static="false" final="false" visibility="public"
  3624. deprecated="Use {@link #setMemoryForMapTask(long mem)} and
  3625. Use {@link #setMemoryForReduceTask(long mem)}">
  3626. <param name="vmem" type="long"/>
  3627. <doc>
  3628. <![CDATA[Set the maximum amount of memory any task of this job can use. See
  3629. {@link #MAPRED_TASK_MAXVMEM_PROPERTY}
  3630. <p/>
  3631. mapred.task.maxvmem is split into
  3632. mapreduce.map.memory.mb
  3633. and mapreduce.reduce.memory.mb;
  3634. each of the new keys is set
  3635. to mapred.task.maxvmem / (1024 * 1024),
  3636. as the new values are in MB.
  3637. @param vmem Maximum amount of virtual memory in bytes any task of this job
  3638. can use.
  3639. @see #getMaxVirtualMemoryForTask()
  3640. @deprecated
  3641. Use {@link #setMemoryForMapTask(long mem)} and
  3642. {@link #setMemoryForReduceTask(long mem)}]]>
  3643. </doc>
  3644. </method>
  3645. <method name="getMaxPhysicalMemoryForTask" return="long"
  3646. abstract="false" native="false" synchronized="false"
  3647. static="false" final="false" visibility="public"
  3648. deprecated="this variable is deprecated and nolonger in use.">
  3649. <doc>
  3650. <![CDATA[@deprecated this variable is deprecated and no longer in use.]]>
  3651. </doc>
  3652. </method>
  3653. <method name="setMaxPhysicalMemoryForTask"
  3654. abstract="false" native="false" synchronized="false"
  3655. static="false" final="false" visibility="public"
  3656. deprecated="not deprecated">
  3657. <param name="mem" type="long"/>
  3658. </method>
  3659. <field name="MAPRED_TASK_MAXVMEM_PROPERTY" type="java.lang.String"
  3660. transient="false" volatile="false"
  3661. static="true" final="true" visibility="public"
  3662. deprecated="Use {@link #MAPRED_JOB_MAP_MEMORY_MB_PROPERTY} and
  3663. {@link #MAPRED_JOB_REDUCE_MEMORY_MB_PROPERTY}">
  3664. <doc>
  3665. <![CDATA[@deprecated Use {@link #MAPRED_JOB_MAP_MEMORY_MB_PROPERTY} and
  3666. {@link #MAPRED_JOB_REDUCE_MEMORY_MB_PROPERTY}]]>
  3667. </doc>
  3668. </field>
  3669. <field name="UPPER_LIMIT_ON_TASK_VMEM_PROPERTY" type="java.lang.String"
  3670. transient="false" volatile="false"
  3671. static="true" final="true" visibility="public"
  3672. deprecated="deprecated, no comment">
  3673. <doc>
  3674. <![CDATA[@deprecated]]>
  3675. </doc>
  3676. </field>
  3677. <field name="MAPRED_TASK_DEFAULT_MAXVMEM_PROPERTY" type="java.lang.String"
  3678. transient="false" volatile="false"
  3679. static="true" final="true" visibility="public"
  3680. deprecated="deprecated, no comment">
  3681. <doc>
  3682. <![CDATA[@deprecated]]>
  3683. </doc>
  3684. </field>
  3685. <field name="MAPRED_TASK_MAXPMEM_PROPERTY" type="java.lang.String"
  3686. transient="false" volatile="false"
  3687. static="true" final="true" visibility="public"
  3688. deprecated="deprecated, no comment">
  3689. <doc>
  3690. <![CDATA[@deprecated]]>
  3691. </doc>
  3692. </field>
  3693. <field name="DISABLED_MEMORY_LIMIT" type="long"
  3694. transient="false" volatile="false"
  3695. static="true" final="true" visibility="public"
  3696. deprecated="not deprecated">
  3697. <doc>
  3698. <![CDATA[A value which if set for memory related configuration options,
  3699. indicates that the options are turned off.]]>
  3700. </doc>
  3701. </field>
  3702. <field name="MAPRED_LOCAL_DIR_PROPERTY" type="java.lang.String"
  3703. transient="false" volatile="false"
  3704. static="true" final="true" visibility="public"
  3705. deprecated="not deprecated">
  3706. <doc>
  3707. <![CDATA[Property name for the configuration property mapreduce.cluster.local.dir]]>
  3708. </doc>
  3709. </field>
  3710. <field name="DEFAULT_QUEUE_NAME" type="java.lang.String"
  3711. transient="false" volatile="false"
  3712. static="true" final="true" visibility="public"
  3713. deprecated="not deprecated">
  3714. <doc>
  3715. <![CDATA[Name of the queue to which jobs will be submitted, if no queue
  3716. name is mentioned.]]>
  3717. </doc>
  3718. </field>
  3719. <field name="UNPACK_JAR_PATTERN_DEFAULT" type="java.util.regex.Pattern"
  3720. transient="false" volatile="false"
  3721. static="true" final="true" visibility="public"
  3722. deprecated="not deprecated">
  3723. <doc>
  3724. <![CDATA[Pattern for the default unpacking behavior for job jars]]>
  3725. </doc>
  3726. </field>
  3727. <field name="MAPRED_TASK_JAVA_OPTS" type="java.lang.String"
  3728. transient="false" volatile="false"
  3729. static="true" final="true" visibility="public"
  3730. deprecated="Use {@link #MAPRED_MAP_TASK_JAVA_OPTS} or
  3731. {@link #MAPRED_REDUCE_TASK_JAVA_OPTS}">
  3732. <doc>
  3733. <![CDATA[Configuration key to set the java command line options for the child
  3734. map and reduce tasks.
  3735. Java opts for the task tracker child processes.
  3736. The following symbol, if present, will be interpolated: @taskid@.
  3737. It is replaced by current TaskID. Any other occurrences of '@' will go
  3738. unchanged.
  3739. For example, to enable verbose gc logging to a file named for the taskid in
  3740. /tmp and to set the heap maximum to be a gigabyte, pass a 'value' of:
  3741. -Xmx1024m -verbose:gc -Xloggc:/tmp/@taskid@.gc
  3742. The configuration variable {@link #MAPRED_TASK_ULIMIT} can be used to
  3743. control the maximum virtual memory of the child processes.
  3744. The configuration variable {@link #MAPRED_TASK_ENV} can be used to pass
  3745. other environment variables to the child processes.
  3746. @deprecated Use {@link #MAPRED_MAP_TASK_JAVA_OPTS} or
  3747. {@link #MAPRED_REDUCE_TASK_JAVA_OPTS}]]>
  3748. </doc>
  3749. </field>
  3750. <field name="MAPRED_MAP_TASK_JAVA_OPTS" type="java.lang.String"
  3751. transient="false" volatile="false"
  3752. static="true" final="true" visibility="public"
  3753. deprecated="not deprecated">
  3754. <doc>
  3755. <![CDATA[Configuration key to set the java command line options for the map tasks.
  3756. Java opts for the task tracker child map processes.
  3757. The following symbol, if present, will be interpolated: @taskid@.
  3758. It is replaced by current TaskID. Any other occurrences of '@' will go
  3759. unchanged.
  3760. For example, to enable verbose gc logging to a file named for the taskid in
  3761. /tmp and to set the heap maximum to be a gigabyte, pass a 'value' of:
  3762. -Xmx1024m -verbose:gc -Xloggc:/tmp/@taskid@.gc
  3763. The configuration variable {@link #MAPRED_MAP_TASK_ULIMIT} can be used to
  3764. control the maximum virtual memory of the map processes.
  3765. The configuration variable {@link #MAPRED_MAP_TASK_ENV} can be used to pass
  3766. other environment variables to the map processes.]]>
  3767. </doc>
  3768. </field>
  3769. <field name="MAPRED_REDUCE_TASK_JAVA_OPTS" type="java.lang.String"
  3770. transient="false" volatile="false"
  3771. static="true" final="true" visibility="public"
  3772. deprecated="not deprecated">
  3773. <doc>
  3774. <![CDATA[Configuration key to set the java command line options for the reduce tasks.
  3775. Java opts for the task tracker child reduce processes.
  3776. The following symbol, if present, will be interpolated: @taskid@.
  3777. It is replaced by current TaskID. Any other occurrences of '@' will go
  3778. unchanged.
  3779. For example, to enable verbose gc logging to a file named for the taskid in
  3780. /tmp and to set the heap maximum to be a gigabyte, pass a 'value' of:
  3781. -Xmx1024m -verbose:gc -Xloggc:/tmp/@taskid@.gc
  3782. The configuration variable {@link #MAPRED_REDUCE_TASK_ULIMIT} can be used
  3783. to control the maximum virtual memory of the reduce processes.
  3784. The configuration variable {@link #MAPRED_REDUCE_TASK_ENV} can be used to
  3785. pass process environment variables to the reduce processes.]]>
  3786. </doc>
  3787. </field>
  3788. <field name="DEFAULT_MAPRED_TASK_JAVA_OPTS" type="java.lang.String"
  3789. transient="false" volatile="false"
  3790. static="true" final="true" visibility="public"
  3791. deprecated="not deprecated">
  3792. </field>
  3793. <field name="MAPRED_TASK_ULIMIT" type="java.lang.String"
  3794. transient="false" volatile="false"
  3795. static="true" final="true" visibility="public"
  3796. deprecated="Use {@link #MAPRED_MAP_TASK_ULIMIT} or
  3797. {@link #MAPRED_REDUCE_TASK_ULIMIT}">
  3798. <doc>
  3799. <![CDATA[Configuration key to set the maximum virtual memory available to the child
  3800. map and reduce tasks (in kilo-bytes).
  3801. Note: This must be greater than or equal to the -Xmx passed to the JavaVM
  3802. via {@link #MAPRED_TASK_JAVA_OPTS}, else the VM might not start.
  3803. @deprecated Use {@link #MAPRED_MAP_TASK_ULIMIT} or
  3804. {@link #MAPRED_REDUCE_TASK_ULIMIT}]]>
  3805. </doc>
  3806. </field>
  3807. <field name="MAPRED_MAP_TASK_ULIMIT" type="java.lang.String"
  3808. transient="false" volatile="false"
  3809. static="true" final="true" visibility="public"
  3810. deprecated="not deprecated">
  3811. <doc>
  3812. <![CDATA[Configuration key to set the maximum virtual memory available to the
  3813. map tasks (in kilo-bytes).
  3814. Note: This must be greater than or equal to the -Xmx passed to the JavaVM
  3815. via {@link #MAPRED_MAP_TASK_JAVA_OPTS}, else the VM might not start.]]>
  3816. </doc>
  3817. </field>
  3818. <field name="MAPRED_REDUCE_TASK_ULIMIT" type="java.lang.String"
  3819. transient="false" volatile="false"
  3820. static="true" final="true" visibility="public"
  3821. deprecated="not deprecated">
  3822. <doc>
  3823. <![CDATA[Configuration key to set the maximum virtual memory available to the
  3824. reduce tasks (in kilo-bytes).
  3825. Note: This must be greater than or equal to the -Xmx passed to the JavaVM
  3826. via {@link #MAPRED_REDUCE_TASK_JAVA_OPTS}, else the VM might not start.]]>
  3827. </doc>
  3828. </field>
  3829. <field name="MAPRED_TASK_ENV" type="java.lang.String"
  3830. transient="false" volatile="false"
  3831. static="true" final="true" visibility="public"
  3832. deprecated="Use {@link #MAPRED_MAP_TASK_ENV} or
  3833. {@link #MAPRED_REDUCE_TASK_ENV}">
  3834. <doc>
  3835. <![CDATA[Configuration key to set the environment of the child map/reduce tasks.
  3836. The format of the value is <code>k1=v1,k2=v2</code>. Further it can
  3837. reference existing environment variables via <code>$key</code>.
  3838. Example:
  3839. <ul>
  3840. <li> A=foo - This will set the env variable A to foo. </li>
  3841. <li> B=$X:c - This will inherit the tasktracker's X env variable. </li>
  3842. </ul>
  3843. @deprecated Use {@link #MAPRED_MAP_TASK_ENV} or
  3844. {@link #MAPRED_REDUCE_TASK_ENV}]]>
  3845. </doc>
  3846. </field>
  3847. <field name="MAPRED_MAP_TASK_ENV" type="java.lang.String"
  3848. transient="false" volatile="false"
  3849. static="true" final="true" visibility="public"
  3850. deprecated="not deprecated">
  3851. <doc>
  3852. <![CDATA[Configuration key to set the environment of the child
  3853. map tasks.
  3854. The format of the value is <code>k1=v1,k2=v2</code>. Further it can
  3855. reference existing environment variables via <code>$key</code>.
  3856. Example:
  3857. <ul>
  3858. <li> A=foo - This will set the env variable A to foo. </li>
  3859. <li> B=$X:c - This will inherit the tasktracker's X env variable. </li>
  3860. </ul>]]>
  3861. </doc>
  3862. </field>
  3863. <field name="MAPRED_REDUCE_TASK_ENV" type="java.lang.String"
  3864. transient="false" volatile="false"
  3865. static="true" final="true" visibility="public"
  3866. deprecated="not deprecated">
  3867. <doc>
  3868. <![CDATA[Configuration key to set the environment of the child
  3869. reduce tasks.
  3870. The format of the value is <code>k1=v1,k2=v2</code>. Further it can
  3871. reference existing environment variables via <code>$key</code>.
  3872. Example:
  3873. <ul>
  3874. <li> A=foo - This will set the env variable A to foo. </li>
  3875. <li> B=$X:c - This will inherit the tasktracker's X env variable. </li>
  3876. </ul>]]>
  3877. </doc>
  3878. </field>
  3879. <field name="MAPRED_MAP_TASK_LOG_LEVEL" type="java.lang.String"
  3880. transient="false" volatile="false"
  3881. static="true" final="true" visibility="public"
  3882. deprecated="not deprecated">
  3883. <doc>
  3884. <![CDATA[Configuration key to set the logging {@link Level} for the map task.
  3885. The allowed logging levels are:
  3886. OFF, FATAL, ERROR, WARN, INFO, DEBUG, TRACE and ALL.]]>
  3887. </doc>
  3888. </field>
  3889. <field name="MAPRED_REDUCE_TASK_LOG_LEVEL" type="java.lang.String"
  3890. transient="false" volatile="false"
  3891. static="true" final="true" visibility="public"
  3892. deprecated="not deprecated">
  3893. <doc>
  3894. <![CDATA[Configuration key to set the logging {@link Level} for the reduce task.
  3895. The allowed logging levels are:
  3896. OFF, FATAL, ERROR, WARN, INFO, DEBUG, TRACE and ALL.]]>
  3897. </doc>
  3898. </field>
  3899. <field name="DEFAULT_LOG_LEVEL" type="org.apache.log4j.Level"
  3900. transient="false" volatile="false"
  3901. static="true" final="true" visibility="public"
  3902. deprecated="not deprecated">
  3903. <doc>
  3904. <![CDATA[Default logging level for map/reduce tasks.]]>
  3905. </doc>
  3906. </field>
  3907. <doc>
  3908. <![CDATA[A map/reduce job configuration.
  3909. <p><code>JobConf</code> is the primary interface for a user to describe a
  3910. map-reduce job to the Hadoop framework for execution. The framework tries to
  3911. faithfully execute the job as-is described by <code>JobConf</code>, however:
  3912. <ol>
  3913. <li>
  3914. Some configuration parameters might have been marked as
  3915. <a href="{@docRoot}/org/apache/hadoop/conf/Configuration.html#FinalParams">
  3916. final</a> by administrators and hence cannot be altered.
  3917. </li>
  3918. <li>
  3919. While some job parameters are straight-forward to set
  3920. (e.g. {@link #setNumReduceTasks(int)}), some parameters interact subtly with the
  3921. rest of the framework and/or job-configuration and are relatively more
  3922. complex for the user to control finely (e.g. {@link #setNumMapTasks(int)}).
  3923. </li>
  3924. </ol></p>
  3925. <p><code>JobConf</code> typically specifies the {@link Mapper}, combiner
  3926. (if any), {@link Partitioner}, {@link Reducer}, {@link InputFormat} and
  3927. {@link OutputFormat} implementations to be used etc.</p>
  3928. <p>Optionally <code>JobConf</code> is used to specify other advanced facets
  3929. of the job such as <code>Comparator</code>s to be used, files to be put in
  3930. the {@link DistributedCache}, whether or not intermediate and/or job outputs
  3931. are to be compressed (and how), debuggability via user-provided scripts
  3932. ({@link #setMapDebugScript(String)}/{@link #setReduceDebugScript(String)})
  3933. for doing post-processing on task logs, task's stdout, stderr, syslog,
  3934. etc.</p>
  3935. <p>Here is an example on how to configure a job via <code>JobConf</code>:</p>
  3936. <p><blockquote><pre>
  3937. // Create a new JobConf
  3938. JobConf job = new JobConf(new Configuration(), MyJob.class);
  3939. // Specify various job-specific parameters
  3940. job.setJobName("myjob");
  3941. FileInputFormat.setInputPaths(job, new Path("in"));
  3942. FileOutputFormat.setOutputPath(job, new Path("out"));
  3943. job.setMapperClass(MyJob.MyMapper.class);
  3944. job.setCombinerClass(MyJob.MyReducer.class);
  3945. job.setReducerClass(MyJob.MyReducer.class);
  3946. job.setInputFormat(SequenceFileInputFormat.class);
  3947. job.setOutputFormat(SequenceFileOutputFormat.class);
  3948. </pre></blockquote></p>
  3949. @see JobClient
  3950. @see ClusterStatus
  3951. @see Tool
  3952. @see DistributedCache
  3953. @deprecated Use {@link Configuration} instead]]>
  3954. </doc>
  3955. </class>
  3956. <!-- end class org.apache.hadoop.mapred.JobConf -->
  3957. <!-- start interface org.apache.hadoop.mapred.JobConfigurable -->
  3958. <interface name="JobConfigurable" abstract="true"
  3959. static="false" final="false" visibility="public"
  3960. deprecated="not deprecated">
  3961. <method name="configure"
  3962. abstract="false" native="false" synchronized="false"
  3963. static="false" final="false" visibility="public"
  3964. deprecated="not deprecated">
  3965. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  3966. <doc>
  3967. <![CDATA[Initializes a new instance from a {@link JobConf}.
  3968. @param job the configuration]]>
  3969. </doc>
  3970. </method>
  3971. <doc>
  3972. <![CDATA[Something that may be configured from a {@link JobConf}.]]>
  3973. </doc>
  3974. </interface>
  3975. <!-- end interface org.apache.hadoop.mapred.JobConfigurable -->
  3976. <!-- start interface org.apache.hadoop.mapred.JobContext -->
  3977. <interface name="JobContext" abstract="true"
  3978. static="false" final="false" visibility="public"
  3979. deprecated="Use {@link org.apache.hadoop.mapreduce.JobContext} instead.">
  3980. <implements name="org.apache.hadoop.mapreduce.JobContext"/>
  3981. <method name="getJobConf" return="org.apache.hadoop.mapred.JobConf"
  3982. abstract="false" native="false" synchronized="false"
  3983. static="false" final="false" visibility="public"
  3984. deprecated="not deprecated">
  3985. <doc>
  3986. <![CDATA[Get the job Configuration
  3987. @return JobConf]]>
  3988. </doc>
  3989. </method>
  3990. <method name="getProgressible" return="org.apache.hadoop.util.Progressable"
  3991. abstract="false" native="false" synchronized="false"
  3992. static="false" final="false" visibility="public"
  3993. deprecated="not deprecated">
  3994. <doc>
  3995. <![CDATA[Get the progress mechanism for reporting progress.
  3996. @return progress mechanism]]>
  3997. </doc>
  3998. </method>
  3999. <doc>
  4000. <![CDATA[@deprecated Use {@link org.apache.hadoop.mapreduce.JobContext} instead.]]>
  4001. </doc>
  4002. </interface>
  4003. <!-- end interface org.apache.hadoop.mapred.JobContext -->
  4004. <!-- start class org.apache.hadoop.mapred.JobID -->
  4005. <class name="JobID" extends="org.apache.hadoop.mapreduce.JobID"
  4006. abstract="false"
  4007. static="false" final="false" visibility="public"
  4008. deprecated="not deprecated">
  4009. <constructor name="JobID" type="java.lang.String, int"
  4010. static="false" final="false" visibility="public"
  4011. deprecated="not deprecated">
  4012. <doc>
  4013. <![CDATA[Constructs a JobID object
  4014. @param jtIdentifier jobTracker identifier
  4015. @param id job number]]>
  4016. </doc>
  4017. </constructor>
  4018. <constructor name="JobID"
  4019. static="false" final="false" visibility="public"
  4020. deprecated="not deprecated">
  4021. </constructor>
  4022. <method name="downgrade" return="org.apache.hadoop.mapred.JobID"
  4023. abstract="false" native="false" synchronized="false"
  4024. static="true" final="false" visibility="public"
  4025. deprecated="not deprecated">
  4026. <param name="old" type="org.apache.hadoop.mapreduce.JobID"/>
  4027. <doc>
  4028. <![CDATA[Downgrade a new JobID to an old one
  4029. @param old a new or old JobID
  4030. @return either old or a new JobID built to match old]]>
  4031. </doc>
  4032. </method>
  4033. <method name="read" return="org.apache.hadoop.mapred.JobID"
  4034. abstract="false" native="false" synchronized="false"
  4035. static="true" final="false" visibility="public"
  4036. deprecated="not deprecated">
  4037. <param name="in" type="java.io.DataInput"/>
  4038. <exception name="IOException" type="java.io.IOException"/>
  4039. </method>
  4040. <method name="forName" return="org.apache.hadoop.mapred.JobID"
  4041. abstract="false" native="false" synchronized="false"
  4042. static="true" final="false" visibility="public"
  4043. deprecated="not deprecated">
  4044. <param name="str" type="java.lang.String"/>
  4045. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  4046. <doc>
  4047. <![CDATA[Construct a JobId object from given string
  4048. @return constructed JobId object or null if the given String is null
  4049. @throws IllegalArgumentException if the given string is malformed]]>
  4050. </doc>
  4051. </method>
  4052. <method name="getJobIDsPattern" return="java.lang.String"
  4053. abstract="false" native="false" synchronized="false"
  4054. static="true" final="false" visibility="public"
  4055. deprecated="not deprecated">
  4056. <param name="jtIdentifier" type="java.lang.String"/>
  4057. <param name="jobId" type="java.lang.Integer"/>
  4058. <doc>
  4059. <![CDATA[Returns a regex pattern which matches job IDs. Arguments can
  4060. be given null, in which case that part of the regex will be generic.
  4061. For example to obtain a regex matching <i>any job</i>
  4062. run on the jobtracker started at <i>200707121733</i>, we would use :
  4063. <pre>
  4064. JobID.getJobIDsPattern("200707121733", null);
  4065. </pre>
  4066. which will return :
  4067. <pre> "job_200707121733_[0-9]*" </pre>
  4068. @param jtIdentifier jobTracker identifier, or null
  4069. @param jobId job number, or null
  4070. @return a regex pattern matching JobIDs]]>
  4071. </doc>
  4072. </method>
  4073. <doc>
  4074. <![CDATA[JobID represents the immutable and unique identifier for
  4075. the job. JobID consists of two parts. First part
  4076. represents the jobtracker identifier, so that jobID to jobtracker map
  4077. is defined. For cluster setup this string is the jobtracker
  4078. start time, for local setting, it is "local".
  4079. Second part of the JobID is the job number. <br>
  4080. An example JobID is :
  4081. <code>job_200707121733_0003</code> , which represents the third job
  4082. running at the jobtracker started at <code>200707121733</code>.
  4083. <p>
  4084. Applications should never construct or parse JobID strings, but rather
  4085. use appropriate constructors or {@link #forName(String)} method.
  4086. @see TaskID
  4087. @see TaskAttemptID]]>
  4088. </doc>
  4089. </class>
  4090. <!-- end class org.apache.hadoop.mapred.JobID -->
  4091. <!-- start class org.apache.hadoop.mapred.JobPriority -->
  4092. <class name="JobPriority" extends="java.lang.Enum"
  4093. abstract="false"
  4094. static="false" final="true" visibility="public"
  4095. deprecated="Use {@link org.apache.hadoop.mapreduce.JobPriority} instead">
  4096. <method name="values" return="org.apache.hadoop.mapred.JobPriority[]"
  4097. abstract="false" native="false" synchronized="false"
  4098. static="true" final="false" visibility="public"
  4099. deprecated="not deprecated">
  4100. </method>
  4101. <method name="valueOf" return="org.apache.hadoop.mapred.JobPriority"
  4102. abstract="false" native="false" synchronized="false"
  4103. static="true" final="false" visibility="public"
  4104. deprecated="not deprecated">
  4105. <param name="name" type="java.lang.String"/>
  4106. </method>
  4107. <doc>
  4108. <![CDATA[Used to describe the priority of the running job.
  4109. @deprecated Use {@link org.apache.hadoop.mapreduce.JobPriority} instead]]>
  4110. </doc>
  4111. </class>
  4112. <!-- end class org.apache.hadoop.mapred.JobPriority -->
  4113. <!-- start class org.apache.hadoop.mapred.JobQueueInfo -->
  4114. <class name="JobQueueInfo" extends="org.apache.hadoop.mapreduce.QueueInfo"
  4115. abstract="false"
  4116. static="false" final="false" visibility="public"
  4117. deprecated="Use {@link QueueInfo} instead">
  4118. <constructor name="JobQueueInfo"
  4119. static="false" final="false" visibility="public"
  4120. deprecated="not deprecated">
  4121. <doc>
  4122. <![CDATA[Default constructor for Job Queue Info.]]>
  4123. </doc>
  4124. </constructor>
  4125. <constructor name="JobQueueInfo" type="java.lang.String, java.lang.String"
  4126. static="false" final="false" visibility="public"
  4127. deprecated="not deprecated">
  4128. <doc>
  4129. <![CDATA[Construct a new JobQueueInfo object using the queue name and the
  4130. scheduling information passed.
  4131. @param queueName Name of the job queue
  4132. @param schedulingInfo Scheduling Information associated with the job
  4133. queue]]>
  4134. </doc>
  4135. </constructor>
  4136. <method name="setQueueName"
  4137. abstract="false" native="false" synchronized="false"
  4138. static="false" final="false" visibility="protected"
  4139. deprecated="not deprecated">
  4140. <param name="queueName" type="java.lang.String"/>
  4141. <doc>
  4142. <![CDATA[Set the queue name of the JobQueueInfo
  4143. @param queueName Name of the job queue.]]>
  4144. </doc>
  4145. </method>
  4146. <method name="setSchedulingInfo"
  4147. abstract="false" native="false" synchronized="false"
  4148. static="false" final="false" visibility="protected"
  4149. deprecated="not deprecated">
  4150. <param name="schedulingInfo" type="java.lang.String"/>
  4151. <doc>
  4152. <![CDATA[Set the scheduling information associated with a particular job queue
  4153. @param schedulingInfo Scheduling information associated with the job queue]]>
  4154. </doc>
  4155. </method>
  4156. <method name="setQueueState"
  4157. abstract="false" native="false" synchronized="false"
  4158. static="false" final="false" visibility="protected"
  4159. deprecated="not deprecated">
  4160. <param name="state" type="java.lang.String"/>
  4161. <doc>
  4162. <![CDATA[Set the state of the queue
  4163. @param state state of the queue.]]>
  4164. </doc>
  4165. </method>
  4166. <method name="setChildren"
  4167. abstract="false" native="false" synchronized="false"
  4168. static="false" final="false" visibility="protected"
  4169. deprecated="not deprecated">
  4170. <param name="children" type="java.util.List"/>
  4171. </method>
  4172. <method name="getChildren" return="java.util.List"
  4173. abstract="false" native="false" synchronized="false"
  4174. static="false" final="false" visibility="public"
  4175. deprecated="not deprecated">
  4176. </method>
  4177. <method name="setProperties"
  4178. abstract="false" native="false" synchronized="false"
  4179. static="false" final="false" visibility="protected"
  4180. deprecated="not deprecated">
  4181. <param name="props" type="java.util.Properties"/>
  4182. </method>
  4183. <method name="setJobStatuses"
  4184. abstract="false" native="false" synchronized="false"
  4185. static="false" final="false" visibility="protected"
  4186. deprecated="not deprecated">
  4187. <param name="stats" type="org.apache.hadoop.mapreduce.JobStatus[]"/>
  4188. </method>
  4189. <doc>
  4190. <![CDATA[Class that contains the information regarding the Job Queues which are
  4191. maintained by the Hadoop Map/Reduce framework.
  4192. @deprecated Use {@link QueueInfo} instead]]>
  4193. </doc>
  4194. </class>
  4195. <!-- end class org.apache.hadoop.mapred.JobQueueInfo -->
  4196. <!-- start class org.apache.hadoop.mapred.JobStatus -->
  4197. <class name="JobStatus" extends="org.apache.hadoop.mapreduce.JobStatus"
  4198. abstract="false"
  4199. static="false" final="false" visibility="public"
  4200. deprecated="Use {@link org.apache.hadoop.mapreduce.JobStatus} instead">
  4201. <constructor name="JobStatus"
  4202. static="false" final="false" visibility="public"
  4203. deprecated="not deprecated">
  4204. </constructor>
  4205. <constructor name="JobStatus" type="org.apache.hadoop.mapred.JobID, float, float, float, int, java.lang.String, java.lang.String, java.lang.String, java.lang.String"
  4206. static="false" final="false" visibility="public"
  4207. deprecated="not deprecated">
  4208. <doc>
  4209. <![CDATA[Create a job status object for a given jobid.
  4210. @param jobid The jobid of the job
  4211. @param mapProgress The progress made on the maps
  4212. @param reduceProgress The progress made on the reduces
  4213. @param cleanupProgress The progress made on cleanup
  4214. @param runState The current state of the job
  4215. @param user userid of the person who submitted the job.
  4216. @param jobName user-specified job name.
  4217. @param jobFile job configuration file.
  4218. @param trackingUrl link to the web-ui for details of the job.]]>
  4219. </doc>
  4220. </constructor>
  4221. <constructor name="JobStatus" type="org.apache.hadoop.mapred.JobID, float, float, int, java.lang.String, java.lang.String, java.lang.String, java.lang.String"
  4222. static="false" final="false" visibility="public"
  4223. deprecated="not deprecated">
  4224. <doc>
  4225. <![CDATA[Create a job status object for a given jobid.
  4226. @param jobid The jobid of the job
  4227. @param mapProgress The progress made on the maps
  4228. @param reduceProgress The progress made on the reduces
  4229. @param runState The current state of the job
  4230. @param user userid of the person who submitted the job.
  4231. @param jobName user-specified job name.
  4232. @param jobFile job configuration file.
  4233. @param trackingUrl link to the web-ui for details of the job.]]>
  4234. </doc>
  4235. </constructor>
  4236. <constructor name="JobStatus" type="org.apache.hadoop.mapred.JobID, float, float, float, int, org.apache.hadoop.mapred.JobPriority, java.lang.String, java.lang.String, java.lang.String, java.lang.String"
  4237. static="false" final="false" visibility="public"
  4238. deprecated="not deprecated">
  4239. <doc>
  4240. <![CDATA[Create a job status object for a given jobid.
  4241. @param jobid The jobid of the job
  4242. @param mapProgress The progress made on the maps
  4243. @param reduceProgress The progress made on the reduces
  @param cleanupProgress The progress made on cleanup
  4244. @param runState The current state of the job
  4245. @param jp Priority of the job.
  4246. @param user userid of the person who submitted the job.
  4247. @param jobName user-specified job name.
  4248. @param jobFile job configuration file.
  4249. @param trackingUrl link to the web-ui for details of the job.]]>
  4250. </doc>
  4251. </constructor>
  4252. <constructor name="JobStatus" type="org.apache.hadoop.mapred.JobID, float, float, float, float, int, org.apache.hadoop.mapred.JobPriority, java.lang.String, java.lang.String, java.lang.String, java.lang.String"
  4253. static="false" final="false" visibility="public"
  4254. deprecated="not deprecated">
  4255. <doc>
  4256. <![CDATA[Create a job status object for a given jobid.
  4257. @param jobid The jobid of the job
  4258. @param setupProgress The progress made on the setup
  4259. @param mapProgress The progress made on the maps
  4260. @param reduceProgress The progress made on the reduces
  4261. @param cleanupProgress The progress made on the cleanup
  4262. @param runState The current state of the job
  4263. @param jp Priority of the job.
  4264. @param user userid of the person who submitted the job.
  4265. @param jobName user-specified job name.
  4266. @param jobFile job configuration file.
  4267. @param trackingUrl link to the web-ui for details of the job.]]>
  4268. </doc>
  4269. </constructor>
  4270. <method name="getJobRunState" return="java.lang.String"
  4271. abstract="false" native="false" synchronized="false"
  4272. static="true" final="false" visibility="public"
  4273. deprecated="not deprecated">
  4274. <param name="state" type="int"/>
  4275. <doc>
  4276. <![CDATA[Helper method to get human-readable state of the job.
  4277. @param state job state
  4278. @return human-readable state of the job]]>
  4279. </doc>
  4280. </method>
  4281. <method name="downgrade" return="org.apache.hadoop.mapred.JobStatus"
  4282. abstract="false" native="false" synchronized="false"
  4283. static="true" final="false" visibility="public"
  4284. deprecated="not deprecated">
  4285. <param name="stat" type="org.apache.hadoop.mapreduce.JobStatus"/>
  4286. </method>
  4287. <method name="getJobId" return="java.lang.String"
  4288. abstract="false" native="false" synchronized="false"
  4289. static="false" final="false" visibility="public"
  4290. deprecated="use getJobID instead">
  4291. <doc>
  4292. <![CDATA[@deprecated use getJobID instead]]>
  4293. </doc>
  4294. </method>
  4295. <method name="getJobID" return="org.apache.hadoop.mapred.JobID"
  4296. abstract="false" native="false" synchronized="false"
  4297. static="false" final="false" visibility="public"
  4298. deprecated="not deprecated">
  4299. <doc>
  4300. <![CDATA[@return The jobid of the Job]]>
  4301. </doc>
  4302. </method>
  4303. <method name="getJobPriority" return="org.apache.hadoop.mapred.JobPriority"
  4304. abstract="false" native="false" synchronized="true"
  4305. static="false" final="false" visibility="public"
  4306. deprecated="not deprecated">
  4307. <doc>
  4308. <![CDATA[Return the priority of the job
  4309. @return job priority]]>
  4310. </doc>
  4311. </method>
  4312. <method name="setMapProgress"
  4313. abstract="false" native="false" synchronized="true"
  4314. static="false" final="false" visibility="protected"
  4315. deprecated="not deprecated">
  4316. <param name="p" type="float"/>
  4317. <doc>
  4318. <![CDATA[Sets the map progress of this job
  4319. @param p The value of map progress to set to]]>
  4320. </doc>
  4321. </method>
  4322. <method name="setCleanupProgress"
  4323. abstract="false" native="false" synchronized="true"
  4324. static="false" final="false" visibility="protected"
  4325. deprecated="not deprecated">
  4326. <param name="p" type="float"/>
  4327. <doc>
  4328. <![CDATA[Sets the cleanup progress of this job
  4329. @param p The value of cleanup progress to set to]]>
  4330. </doc>
  4331. </method>
  4332. <method name="setSetupProgress"
  4333. abstract="false" native="false" synchronized="true"
  4334. static="false" final="false" visibility="protected"
  4335. deprecated="not deprecated">
  4336. <param name="p" type="float"/>
  4337. <doc>
  4338. <![CDATA[Sets the setup progress of this job
  4339. @param p The value of setup progress to set to]]>
  4340. </doc>
  4341. </method>
  4342. <method name="setReduceProgress"
  4343. abstract="false" native="false" synchronized="true"
  4344. static="false" final="false" visibility="protected"
  4345. deprecated="not deprecated">
  4346. <param name="p" type="float"/>
  4347. <doc>
  4348. <![CDATA[Sets the reduce progress of this Job
  4349. @param p The value of reduce progress to set to]]>
  4350. </doc>
  4351. </method>
  4352. <method name="setFinishTime"
  4353. abstract="false" native="false" synchronized="true"
  4354. static="false" final="false" visibility="protected"
  4355. deprecated="not deprecated">
  4356. <param name="finishTime" type="long"/>
  4357. <doc>
  4358. <![CDATA[Set the finish time of the job
  4359. @param finishTime The finishTime of the job]]>
  4360. </doc>
  4361. </method>
  4362. <method name="setHistoryFile"
  4363. abstract="false" native="false" synchronized="true"
  4364. static="false" final="false" visibility="protected"
  4365. deprecated="not deprecated">
  4366. <param name="historyFile" type="java.lang.String"/>
  4367. <doc>
  4368. <![CDATA[Set the job history file url for a completed job]]>
  4369. </doc>
  4370. </method>
  4371. <method name="setTrackingUrl"
  4372. abstract="false" native="false" synchronized="true"
  4373. static="false" final="false" visibility="protected"
  4374. deprecated="not deprecated">
  4375. <param name="trackingUrl" type="java.lang.String"/>
  4376. <doc>
  4377. <![CDATA[Set the link to the web-ui for details of the job.]]>
  4378. </doc>
  4379. </method>
  4380. <method name="setRetired"
  4381. abstract="false" native="false" synchronized="true"
  4382. static="false" final="false" visibility="protected"
  4383. deprecated="not deprecated">
  4384. <doc>
  4385. <![CDATA[Set the job retire flag to true.]]>
  4386. </doc>
  4387. </method>
  4388. <method name="setRunState"
  4389. abstract="false" native="false" synchronized="true"
  4390. static="false" final="false" visibility="protected"
  4391. deprecated="not deprecated">
  4392. <param name="state" type="int"/>
  4393. <doc>
  4394. <![CDATA[Change the current run state of the job.]]>
  4395. </doc>
  4396. </method>
  4397. <method name="getRunState" return="int"
  4398. abstract="false" native="false" synchronized="true"
  4399. static="false" final="false" visibility="public"
  4400. deprecated="not deprecated">
  4401. <doc>
  4402. <![CDATA[@return running state of the job]]>
  4403. </doc>
  4404. </method>
  4405. <method name="setStartTime"
  4406. abstract="false" native="false" synchronized="true"
  4407. static="false" final="false" visibility="protected"
  4408. deprecated="not deprecated">
  4409. <param name="startTime" type="long"/>
  4410. <doc>
  4411. <![CDATA[Set the start time of the job
  4412. @param startTime The startTime of the job]]>
  4413. </doc>
  4414. </method>
  4415. <method name="setUsername"
  4416. abstract="false" native="false" synchronized="true"
  4417. static="false" final="false" visibility="protected"
  4418. deprecated="not deprecated">
  4419. <param name="userName" type="java.lang.String"/>
  4420. <doc>
  4421. <![CDATA[@param userName The username of the job]]>
  4422. </doc>
  4423. </method>
  4424. <method name="setSchedulingInfo"
  4425. abstract="false" native="false" synchronized="true"
  4426. static="false" final="false" visibility="protected"
  4427. deprecated="not deprecated">
  4428. <param name="schedulingInfo" type="java.lang.String"/>
  4429. <doc>
  4430. <![CDATA[Used to set the scheduling information associated with a particular Job.
  4431. @param schedulingInfo Scheduling information of the job]]>
  4432. </doc>
  4433. </method>
  4434. <method name="setJobACLs"
  4435. abstract="false" native="false" synchronized="true"
  4436. static="false" final="false" visibility="protected"
  4437. deprecated="not deprecated">
  4438. <param name="acls" type="java.util.Map"/>
  4439. </method>
  4440. <method name="setJobPriority"
  4441. abstract="false" native="false" synchronized="true"
  4442. static="false" final="false" visibility="public"
  4443. deprecated="not deprecated">
  4444. <param name="jp" type="org.apache.hadoop.mapred.JobPriority"/>
  4445. <doc>
  4446. <![CDATA[Set the priority of the job, defaulting to NORMAL.
  4447. @param jp new job priority]]>
  4448. </doc>
  4449. </method>
  4450. <method name="mapProgress" return="float"
  4451. abstract="false" native="false" synchronized="true"
  4452. static="false" final="false" visibility="public"
  4453. deprecated="not deprecated">
  4454. <doc>
  4455. <![CDATA[@return Percentage of progress in maps]]>
  4456. </doc>
  4457. </method>
  4458. <method name="cleanupProgress" return="float"
  4459. abstract="false" native="false" synchronized="true"
  4460. static="false" final="false" visibility="public"
  4461. deprecated="not deprecated">
  4462. <doc>
  4463. <![CDATA[@return Percentage of progress in cleanup]]>
  4464. </doc>
  4465. </method>
  4466. <method name="setupProgress" return="float"
  4467. abstract="false" native="false" synchronized="true"
  4468. static="false" final="false" visibility="public"
  4469. deprecated="not deprecated">
  4470. <doc>
  4471. <![CDATA[@return Percentage of progress in setup]]>
  4472. </doc>
  4473. </method>
  4474. <method name="reduceProgress" return="float"
  4475. abstract="false" native="false" synchronized="true"
  4476. static="false" final="false" visibility="public"
  4477. deprecated="not deprecated">
  4478. <doc>
  4479. <![CDATA[@return Percentage of progress in reduce]]>
  4480. </doc>
  4481. </method>
  4482. <field name="RUNNING" type="int"
  4483. transient="false" volatile="false"
  4484. static="true" final="true" visibility="public"
  4485. deprecated="not deprecated">
  4486. </field>
  4487. <field name="SUCCEEDED" type="int"
  4488. transient="false" volatile="false"
  4489. static="true" final="true" visibility="public"
  4490. deprecated="not deprecated">
  4491. </field>
  4492. <field name="FAILED" type="int"
  4493. transient="false" volatile="false"
  4494. static="true" final="true" visibility="public"
  4495. deprecated="not deprecated">
  4496. </field>
  4497. <field name="PREP" type="int"
  4498. transient="false" volatile="false"
  4499. static="true" final="true" visibility="public"
  4500. deprecated="not deprecated">
  4501. </field>
  4502. <field name="KILLED" type="int"
  4503. transient="false" volatile="false"
  4504. static="true" final="true" visibility="public"
  4505. deprecated="not deprecated">
  4506. </field>
  4507. <doc>
  4508. <![CDATA[Describes the current status of a job. This is
  4509. not intended to be a comprehensive piece of data.
  4510. For that, look at JobProfile.
  4511. @deprecated Use {@link org.apache.hadoop.mapreduce.JobStatus} instead]]>
  4512. </doc>
  4513. </class>
  4514. <!-- end class org.apache.hadoop.mapred.JobStatus -->
  4515. <!-- start class org.apache.hadoop.mapred.KeyValueLineRecordReader -->
  4516. <class name="KeyValueLineRecordReader" extends="java.lang.Object"
  4517. abstract="false"
  4518. static="false" final="false" visibility="public"
  4519. deprecated="Use
  4520. {@link org.apache.hadoop.mapreduce.lib.input.KeyValueLineRecordReader}
  4521. instead">
  4522. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  4523. <constructor name="KeyValueLineRecordReader" type="org.apache.hadoop.conf.Configuration, org.apache.hadoop.mapred.FileSplit"
  4524. static="false" final="false" visibility="public"
  4525. deprecated="not deprecated">
  4526. <exception name="IOException" type="java.io.IOException"/>
  4527. </constructor>
  4528. <method name="getKeyClass" return="java.lang.Class"
  4529. abstract="false" native="false" synchronized="false"
  4530. static="false" final="false" visibility="public"
  4531. deprecated="not deprecated">
  4532. </method>
  4533. <method name="createKey" return="org.apache.hadoop.io.Text"
  4534. abstract="false" native="false" synchronized="false"
  4535. static="false" final="false" visibility="public"
  4536. deprecated="not deprecated">
  4537. </method>
  4538. <method name="createValue" return="org.apache.hadoop.io.Text"
  4539. abstract="false" native="false" synchronized="false"
  4540. static="false" final="false" visibility="public"
  4541. deprecated="not deprecated">
  4542. </method>
  4543. <method name="findSeparator" return="int"
  4544. abstract="false" native="false" synchronized="false"
  4545. static="true" final="false" visibility="public"
  4546. deprecated="not deprecated">
  4547. <param name="utf" type="byte[]"/>
  4548. <param name="start" type="int"/>
  4549. <param name="length" type="int"/>
  4550. <param name="sep" type="byte"/>
  4551. </method>
  4552. <method name="next" return="boolean"
  4553. abstract="false" native="false" synchronized="true"
  4554. static="false" final="false" visibility="public"
  4555. deprecated="not deprecated">
  4556. <param name="key" type="org.apache.hadoop.io.Text"/>
  4557. <param name="value" type="org.apache.hadoop.io.Text"/>
  4558. <exception name="IOException" type="java.io.IOException"/>
  4559. <doc>
  4560. <![CDATA[Read key/value pair in a line.]]>
  4561. </doc>
  4562. </method>
  4563. <method name="getProgress" return="float"
  4564. abstract="false" native="false" synchronized="false"
  4565. static="false" final="false" visibility="public"
  4566. deprecated="not deprecated">
  4567. <exception name="IOException" type="java.io.IOException"/>
  4568. </method>
  4569. <method name="getPos" return="long"
  4570. abstract="false" native="false" synchronized="true"
  4571. static="false" final="false" visibility="public"
  4572. deprecated="not deprecated">
  4573. <exception name="IOException" type="java.io.IOException"/>
  4574. </method>
  4575. <method name="close"
  4576. abstract="false" native="false" synchronized="true"
  4577. static="false" final="false" visibility="public"
  4578. deprecated="not deprecated">
  4579. <exception name="IOException" type="java.io.IOException"/>
  4580. </method>
  4581. <doc>
  4582. <![CDATA[This class treats a line in the input as a key/value pair separated by a
  4583. separator character. The separator can be specified in the config file
  4584. under the property name <code>mapreduce.input.keyvaluelinerecordreader.key.value.separator</code>. The default
  4585. separator is the tab character ('\t').
  4586. @deprecated Use
  4587. {@link org.apache.hadoop.mapreduce.lib.input.KeyValueLineRecordReader}
  4588. instead]]>
  4589. </doc>
  4590. </class>
  4591. <!-- end class org.apache.hadoop.mapred.KeyValueLineRecordReader -->
  4592. <!-- start class org.apache.hadoop.mapred.KeyValueTextInputFormat -->
  4593. <class name="KeyValueTextInputFormat" extends="org.apache.hadoop.mapred.FileInputFormat"
  4594. abstract="false"
  4595. static="false" final="false" visibility="public"
  4596. deprecated="Use
  4597. {@link org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat}
  4598. instead">
  4599. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  4600. <constructor name="KeyValueTextInputFormat"
  4601. static="false" final="false" visibility="public"
  4602. deprecated="not deprecated">
  4603. </constructor>
  4604. <method name="configure"
  4605. abstract="false" native="false" synchronized="false"
  4606. static="false" final="false" visibility="public"
  4607. deprecated="not deprecated">
  4608. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  4609. </method>
  4610. <method name="isSplitable" return="boolean"
  4611. abstract="false" native="false" synchronized="false"
  4612. static="false" final="false" visibility="protected"
  4613. deprecated="not deprecated">
  4614. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  4615. <param name="file" type="org.apache.hadoop.fs.Path"/>
  4616. </method>
  4617. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  4618. abstract="false" native="false" synchronized="false"
  4619. static="false" final="false" visibility="public"
  4620. deprecated="not deprecated">
  4621. <param name="genericSplit" type="org.apache.hadoop.mapred.InputSplit"/>
  4622. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  4623. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  4624. <exception name="IOException" type="java.io.IOException"/>
  4625. </method>
  4626. <doc>
  4627. <![CDATA[An {@link InputFormat} for plain text files. Files are broken into lines.
  4628. Either a linefeed or a carriage-return is used to signal end of line. Each line
  4629. is divided into key and value parts by a separator byte. If no such byte
  4630. exists, the key will be the entire line and value will be empty.
  4631. @deprecated Use
  4632. {@link org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat}
  4633. instead]]>
  4634. </doc>
  4635. </class>
  4636. <!-- end class org.apache.hadoop.mapred.KeyValueTextInputFormat -->
  4637. <!-- start class org.apache.hadoop.mapred.LineRecordReader.LineReader -->
  4638. <class name="LineRecordReader.LineReader" extends="org.apache.hadoop.util.LineReader"
  4639. abstract="false"
  4640. static="true" final="false" visibility="public"
  4641. deprecated="Use {@link org.apache.hadoop.util.LineReader} instead.">
  4642. <constructor name="LineRecordReader.LineReader" type="java.io.InputStream, org.apache.hadoop.conf.Configuration"
  4643. static="false" final="false" visibility="public"
  4644. deprecated="not deprecated">
  4645. <exception name="IOException" type="java.io.IOException"/>
  4646. </constructor>
  4647. <doc>
  4648. <![CDATA[A class that provides a line reader from an input stream.
  4649. @deprecated Use {@link org.apache.hadoop.util.LineReader} instead.]]>
  4650. </doc>
  4651. </class>
  4652. <!-- end class org.apache.hadoop.mapred.LineRecordReader.LineReader -->
  4653. <!-- start class org.apache.hadoop.mapred.MapFileOutputFormat -->
  4654. <class name="MapFileOutputFormat" extends="org.apache.hadoop.mapred.FileOutputFormat"
  4655. abstract="false"
  4656. static="false" final="false" visibility="public"
  4657. deprecated="Use
  4658. {@link org.apache.hadoop.mapreduce.lib.output.MapFileOutputFormat} instead">
  4659. <constructor name="MapFileOutputFormat"
  4660. static="false" final="false" visibility="public"
  4661. deprecated="not deprecated">
  4662. </constructor>
  4663. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  4664. abstract="false" native="false" synchronized="false"
  4665. static="false" final="false" visibility="public"
  4666. deprecated="not deprecated">
  4667. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  4668. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  4669. <param name="name" type="java.lang.String"/>
  4670. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  4671. <exception name="IOException" type="java.io.IOException"/>
  4672. </method>
  4673. <method name="getReaders" return="org.apache.hadoop.io.MapFile.Reader[]"
  4674. abstract="false" native="false" synchronized="false"
  4675. static="true" final="false" visibility="public"
  4676. deprecated="not deprecated">
  4677. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  4678. <param name="dir" type="org.apache.hadoop.fs.Path"/>
  4679. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  4680. <exception name="IOException" type="java.io.IOException"/>
  4681. <doc>
  4682. <![CDATA[Open the output generated by this format.]]>
  4683. </doc>
  4684. </method>
  4685. <method name="getEntry" return="org.apache.hadoop.io.Writable"
  4686. abstract="false" native="false" synchronized="false"
  4687. static="true" final="false" visibility="public"
  4688. deprecated="not deprecated">
  4689. <param name="readers" type="org.apache.hadoop.io.MapFile.Reader[]"/>
  4690. <param name="partitioner" type="org.apache.hadoop.mapred.Partitioner"/>
  4691. <param name="key" type="K"/>
  4692. <param name="value" type="V"/>
  4693. <exception name="IOException" type="java.io.IOException"/>
  4694. <doc>
  4695. <![CDATA[Get an entry from output generated by this class.]]>
  4696. </doc>
  4697. </method>
  4698. <doc>
  4699. <![CDATA[An {@link OutputFormat} that writes {@link MapFile}s.
  4700. @deprecated Use
  4701. {@link org.apache.hadoop.mapreduce.lib.output.MapFileOutputFormat} instead]]>
  4702. </doc>
  4703. </class>
  4704. <!-- end class org.apache.hadoop.mapred.MapFileOutputFormat -->
  4705. <!-- start interface org.apache.hadoop.mapred.Mapper -->
  4706. <interface name="Mapper" abstract="true"
  4707. static="false" final="false" visibility="public"
  4708. deprecated="Use {@link org.apache.hadoop.mapreduce.Mapper} instead.">
  4709. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  4710. <implements name="org.apache.hadoop.io.Closeable"/>
  4711. <method name="map"
  4712. abstract="false" native="false" synchronized="false"
  4713. static="false" final="false" visibility="public"
  4714. deprecated="not deprecated">
  4715. <param name="key" type="K1"/>
  4716. <param name="value" type="V1"/>
  4717. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  4718. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  4719. <exception name="IOException" type="java.io.IOException"/>
  4720. <doc>
  4721. <![CDATA[Maps a single input key/value pair into an intermediate key/value pair.
  4722. <p>Output pairs need not be of the same types as input pairs. A given
  4723. input pair may map to zero or many output pairs. Output pairs are
  4724. collected with calls to
  4725. {@link OutputCollector#collect(Object,Object)}.</p>
  4726. <p>Applications can use the {@link Reporter} provided to report progress
  4727. or just indicate that they are alive. In scenarios where the application
  4728. takes a significant amount of time to process individual key/value
  4729. pairs, this is crucial since the framework might assume that the task has
  4730. timed-out and kill that task. The other way of avoiding this is to set
  4731. <a href="{@docRoot}/../mapred-default.html#mapreduce.task.timeout">
  4732. mapreduce.task.timeout</a> to a high-enough value (or even zero for no
  4733. time-outs).</p>
  4734. @param key the input key.
  4735. @param value the input value.
  4736. @param output collects mapped keys and values.
  4737. @param reporter facility to report progress.]]>
  4738. </doc>
  4739. </method>
  4740. <doc>
  4741. <![CDATA[Maps input key/value pairs to a set of intermediate key/value pairs.
  4742. <p>Maps are the individual tasks which transform input records into
  4743. intermediate records. The transformed intermediate records need not be of
  4744. the same type as the input records. A given input pair may map to zero or
  4745. many output pairs.</p>
  4746. <p>The Hadoop Map-Reduce framework spawns one map task for each
  4747. {@link InputSplit} generated by the {@link InputFormat} for the job.
  4748. <code>Mapper</code> implementations can access the {@link JobConf} for the
  4749. job via the {@link JobConfigurable#configure(JobConf)} and initialize
  4750. themselves. Similarly they can use the {@link Closeable#close()} method for
  4751. de-initialization.</p>
  4752. <p>The framework then calls
  4753. {@link #map(Object, Object, OutputCollector, Reporter)}
  4754. for each key/value pair in the <code>InputSplit</code> for that task.</p>
  4755. <p>All intermediate values associated with a given output key are
  4756. subsequently grouped by the framework, and passed to a {@link Reducer} to
  4757. determine the final output. Users can control the grouping by specifying
  4758. a <code>Comparator</code> via
  4759. {@link JobConf#setOutputKeyComparatorClass(Class)}.</p>
  4760. <p>The grouped <code>Mapper</code> outputs are partitioned per
  4761. <code>Reducer</code>. Users can control which keys (and hence records) go to
  4762. which <code>Reducer</code> by implementing a custom {@link Partitioner}.</p>
  4763. <p>Users can optionally specify a <code>combiner</code>, via
  4764. {@link JobConf#setCombinerClass(Class)}, to perform local aggregation of the
  4765. intermediate outputs, which helps to cut down the amount of data transferred
  4766. from the <code>Mapper</code> to the <code>Reducer</code>.</p>
  4767. <p>The intermediate, grouped outputs are always stored in
  4768. {@link SequenceFile}s. Applications can specify if and how the intermediate
  4769. outputs are to be compressed and which {@link CompressionCodec}s are to be
  4770. used via the <code>JobConf</code>.</p>
  4771. <p>If the job has
  4772. <a href="{@docRoot}/org/apache/hadoop/mapred/JobConf.html#ReducerNone">zero
  4773. reduces</a> then the output of the <code>Mapper</code> is directly written
  4774. to the {@link FileSystem} without grouping by keys.</p>
  4775. <p>Example:</p>
  4776. <p><blockquote><pre>
  4777. public class MyMapper&lt;K extends WritableComparable, V extends Writable&gt;
  4778. extends MapReduceBase implements Mapper&lt;K, V, K, V&gt; {
  4779. static enum MyCounters { NUM_RECORDS }
  4780. private String mapTaskId;
  4781. private String inputFile;
  4782. private int noRecords = 0;
  4783. public void configure(JobConf job) {
  4784. mapTaskId = job.get(JobContext.TASK_ATTEMPT_ID);
  4785. inputFile = job.get(JobContext.MAP_INPUT_FILE);
  4786. }
  4787. public void map(K key, V val,
  4788. OutputCollector&lt;K, V&gt; output, Reporter reporter)
  4789. throws IOException {
  4790. // Process the &lt;key, value&gt; pair (assume this takes a while)
  4791. // ...
  4792. // ...
  4793. // Let the framework know that we are alive, and kicking!
  4794. // reporter.progress();
  4795. // Process some more
  4796. // ...
  4797. // ...
  4798. // Increment the no. of &lt;key, value&gt; pairs processed
  4799. ++noRecords;
  4800. // Increment counters
  4801. reporter.incrCounter(NUM_RECORDS, 1);
  4802. // Every 100 records update application-level status
  4803. if ((noRecords%100) == 0) {
  4804. reporter.setStatus(mapTaskId + " processed " + noRecords +
  4805. " from input-file: " + inputFile);
  4806. }
  4807. // Output the result
  4808. output.collect(key, val);
  4809. }
  4810. }
  4811. </pre></blockquote></p>
  4812. <p>Applications may write a custom {@link MapRunnable} to exert greater
  4813. control on map processing e.g. multi-threaded <code>Mapper</code>s etc.</p>
  4814. @see JobConf
  4815. @see InputFormat
  4816. @see Partitioner
  4817. @see Reducer
  4818. @see MapReduceBase
  4819. @see MapRunnable
  4820. @see SequenceFile
  4821. @deprecated Use {@link org.apache.hadoop.mapreduce.Mapper} instead.]]>
  4822. </doc>
  4823. </interface>
  4824. <!-- end interface org.apache.hadoop.mapred.Mapper -->
  4825. <!-- start class org.apache.hadoop.mapred.MapReduceBase -->
  4826. <class name="MapReduceBase" extends="java.lang.Object"
  4827. abstract="false"
  4828. static="false" final="false" visibility="public"
  4829. deprecated="not deprecated">
  4830. <implements name="org.apache.hadoop.io.Closeable"/>
  4831. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  4832. <constructor name="MapReduceBase"
  4833. static="false" final="false" visibility="public"
  4834. deprecated="not deprecated">
  4835. </constructor>
  4836. <method name="close"
  4837. abstract="false" native="false" synchronized="false"
  4838. static="false" final="false" visibility="public"
  4839. deprecated="not deprecated">
  4840. <exception name="IOException" type="java.io.IOException"/>
  4841. <doc>
  4842. <![CDATA[Default implementation that does nothing.]]>
  4843. </doc>
  4844. </method>
  4845. <method name="configure"
  4846. abstract="false" native="false" synchronized="false"
  4847. static="false" final="false" visibility="public"
  4848. deprecated="not deprecated">
  4849. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  4850. <doc>
  4851. <![CDATA[Default implementation that does nothing.]]>
  4852. </doc>
  4853. </method>
  4854. <doc>
  4855. <![CDATA[Base class for {@link Mapper} and {@link Reducer} implementations.
  4856. <p>Provides default no-op implementations for a few methods, most non-trivial
  4857. applications need to override some of them.</p>]]>
  4858. </doc>
  4859. </class>
  4860. <!-- end class org.apache.hadoop.mapred.MapReduceBase -->
  4861. <!-- start interface org.apache.hadoop.mapred.MapRunnable -->
  4862. <interface name="MapRunnable" abstract="true"
  4863. static="false" final="false" visibility="public"
  4864. deprecated="Use {@link org.apache.hadoop.mapreduce.Mapper} instead.">
  4865. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  4866. <method name="run"
  4867. abstract="false" native="false" synchronized="false"
  4868. static="false" final="false" visibility="public"
  4869. deprecated="not deprecated">
  4870. <param name="input" type="org.apache.hadoop.mapred.RecordReader"/>
  4871. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  4872. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  4873. <exception name="IOException" type="java.io.IOException"/>
  4874. <doc>
  4875. <![CDATA[Start mapping input <tt>&lt;key, value&gt;</tt> pairs.
  4876. <p>Mapping of input records to output records is complete when this method
  4877. returns.</p>
  4878. @param input the {@link RecordReader} to read the input records.
  4879. @param output the {@link OutputCollector} to collect the output records.
  4880. @param reporter {@link Reporter} to report progress, status-updates etc.
  4881. @throws IOException]]>
  4882. </doc>
  4883. </method>
  4884. <doc>
  4885. <![CDATA[Expert: Generic interface for {@link Mapper}s.
  4886. <p>Custom implementations of <code>MapRunnable</code> can exert greater
  4887. control on map processing e.g. multi-threaded, asynchronous mappers etc.</p>
  4888. @see Mapper
  4889. @deprecated Use {@link org.apache.hadoop.mapreduce.Mapper} instead.]]>
  4890. </doc>
  4891. </interface>
  4892. <!-- end interface org.apache.hadoop.mapred.MapRunnable -->
  4893. <!-- start class org.apache.hadoop.mapred.MapRunner -->
  4894. <class name="MapRunner" extends="java.lang.Object"
  4895. abstract="false"
  4896. static="false" final="false" visibility="public"
  4897. deprecated="not deprecated">
  4898. <implements name="org.apache.hadoop.mapred.MapRunnable"/>
  4899. <constructor name="MapRunner"
  4900. static="false" final="false" visibility="public"
  4901. deprecated="not deprecated">
  4902. </constructor>
  4903. <method name="configure"
  4904. abstract="false" native="false" synchronized="false"
  4905. static="false" final="false" visibility="public"
  4906. deprecated="not deprecated">
  4907. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  4908. </method>
  4909. <method name="run"
  4910. abstract="false" native="false" synchronized="false"
  4911. static="false" final="false" visibility="public"
  4912. deprecated="not deprecated">
  4913. <param name="input" type="org.apache.hadoop.mapred.RecordReader"/>
  4914. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  4915. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  4916. <exception name="IOException" type="java.io.IOException"/>
  4917. </method>
  4918. <method name="getMapper" return="org.apache.hadoop.mapred.Mapper"
  4919. abstract="false" native="false" synchronized="false"
  4920. static="false" final="false" visibility="protected"
  4921. deprecated="not deprecated">
  4922. </method>
  4923. <doc>
  4924. <![CDATA[Default {@link MapRunnable} implementation.]]>
  4925. </doc>
  4926. </class>
  4927. <!-- end class org.apache.hadoop.mapred.MapRunner -->
  4928. <!-- start class org.apache.hadoop.mapred.MultiFileInputFormat -->
  4929. <class name="MultiFileInputFormat" extends="org.apache.hadoop.mapred.FileInputFormat"
  4930. abstract="true"
  4931. static="false" final="false" visibility="public"
  4932. deprecated="Use {@link org.apache.hadoop.mapred.lib.CombineFileInputFormat} instead">
  4933. <constructor name="MultiFileInputFormat"
  4934. static="false" final="false" visibility="public"
  4935. deprecated="not deprecated">
  4936. </constructor>
  4937. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  4938. abstract="false" native="false" synchronized="false"
  4939. static="false" final="false" visibility="public"
  4940. deprecated="not deprecated">
  4941. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  4942. <param name="numSplits" type="int"/>
  4943. <exception name="IOException" type="java.io.IOException"/>
  4944. </method>
  4945. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  4946. abstract="true" native="false" synchronized="false"
  4947. static="false" final="false" visibility="public"
  4948. deprecated="not deprecated">
  4949. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  4950. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  4951. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  4952. <exception name="IOException" type="java.io.IOException"/>
  4953. </method>
  4954. <doc>
  4955. <![CDATA[An abstract {@link InputFormat} that returns {@link MultiFileSplit}'s
  4956. in {@link #getSplits(JobConf, int)} method. Splits are constructed from
  4957. the files under the input paths. Each split returned contains <i>nearly</i>
  4958. equal content length. <br>
  4959. Subclasses implement {@link #getRecordReader(InputSplit, JobConf, Reporter)}
  4960. to construct <code>RecordReader</code>'s for <code>MultiFileSplit</code>'s.
  4961. @see MultiFileSplit
  4962. @deprecated Use {@link org.apache.hadoop.mapred.lib.CombineFileInputFormat} instead]]>
  4963. </doc>
  4964. </class>
  4965. <!-- end class org.apache.hadoop.mapred.MultiFileInputFormat -->
  4966. <!-- start class org.apache.hadoop.mapred.MultiFileSplit -->
  4967. <class name="MultiFileSplit" extends="org.apache.hadoop.mapred.lib.CombineFileSplit"
  4968. abstract="false"
  4969. static="false" final="false" visibility="public"
  4970. deprecated="Use {@link org.apache.hadoop.mapred.lib.CombineFileSplit} instead">
  4971. <constructor name="MultiFileSplit" type="org.apache.hadoop.mapred.JobConf, org.apache.hadoop.fs.Path[], long[]"
  4972. static="false" final="false" visibility="public"
  4973. deprecated="not deprecated">
  4974. </constructor>
  4975. <method name="getLocations" return="java.lang.String[]"
  4976. abstract="false" native="false" synchronized="false"
  4977. static="false" final="false" visibility="public"
  4978. deprecated="not deprecated">
  4979. <exception name="IOException" type="java.io.IOException"/>
  4980. </method>
  4981. <method name="toString" return="java.lang.String"
  4982. abstract="false" native="false" synchronized="false"
  4983. static="false" final="false" visibility="public"
  4984. deprecated="not deprecated">
  4985. </method>
  4986. <doc>
  4987. <![CDATA[A sub-collection of input files. Unlike {@link FileSplit}, MultiFileSplit
  4988. class does not represent a split of a file, but a split of input files
  4989. into smaller sets. The atomic unit of split is a file. <br>
  4990. MultiFileSplit can be used to implement {@link RecordReader}'s, with
  4991. reading one record per file.
  4992. @see FileSplit
  4993. @see MultiFileInputFormat
  4994. @deprecated Use {@link org.apache.hadoop.mapred.lib.CombineFileSplit} instead]]>
  4995. </doc>
  4996. </class>
  4997. <!-- end class org.apache.hadoop.mapred.MultiFileSplit -->
  4998. <!-- start interface org.apache.hadoop.mapred.OutputCollector -->
  4999. <interface name="OutputCollector" abstract="true"
  5000. static="false" final="false" visibility="public"
  5001. deprecated="not deprecated">
  5002. <method name="collect"
  5003. abstract="false" native="false" synchronized="false"
  5004. static="false" final="false" visibility="public"
  5005. deprecated="not deprecated">
  5006. <param name="key" type="K"/>
  5007. <param name="value" type="V"/>
  5008. <exception name="IOException" type="java.io.IOException"/>
  5009. <doc>
  5010. <![CDATA[Adds a key/value pair to the output.
  5011. @param key the key to collect.
  5012. @param value the value to collect.
  5013. @throws IOException]]>
  5014. </doc>
  5015. </method>
  5016. <doc>
  5017. <![CDATA[Collects the <code>&lt;key, value&gt;</code> pairs output by {@link Mapper}s
  5018. and {@link Reducer}s.
  5019. <p><code>OutputCollector</code> is the generalization of the facility
  5020. provided by the Map-Reduce framework to collect data output by either the
  5021. <code>Mapper</code> or the <code>Reducer</code> i.e. intermediate outputs
  5022. or the output of the job.</p>]]>
  5023. </doc>
  5024. </interface>
  5025. <!-- end interface org.apache.hadoop.mapred.OutputCollector -->
  5026. <!-- start class org.apache.hadoop.mapred.OutputCommitter -->
  5027. <class name="OutputCommitter" extends="org.apache.hadoop.mapreduce.OutputCommitter"
  5028. abstract="true"
  5029. static="false" final="false" visibility="public"
  5030. deprecated="Use {@link org.apache.hadoop.mapreduce.OutputCommitter} instead.">
  5031. <constructor name="OutputCommitter"
  5032. static="false" final="false" visibility="public"
  5033. deprecated="not deprecated">
  5034. </constructor>
  5035. <method name="setupJob"
  5036. abstract="true" native="false" synchronized="false"
  5037. static="false" final="false" visibility="public"
  5038. deprecated="not deprecated">
  5039. <param name="jobContext" type="org.apache.hadoop.mapred.JobContext"/>
  5040. <exception name="IOException" type="java.io.IOException"/>
  5041. <doc>
  5042. <![CDATA[For the framework to setup the job output during initialization
  5043. @param jobContext Context of the job whose output is being written.
  5044. @throws IOException if temporary output could not be created]]>
  5045. </doc>
  5046. </method>
  5047. <method name="cleanupJob"
  5048. abstract="false" native="false" synchronized="false"
  5049. static="false" final="false" visibility="public"
  5050. deprecated="Use {@link #commitJob(JobContext)} or
  5051. {@link #abortJob(JobContext, int)} instead.">
  5052. <param name="jobContext" type="org.apache.hadoop.mapred.JobContext"/>
  5053. <exception name="IOException" type="java.io.IOException"/>
  5054. <doc>
  5055. <![CDATA[For cleaning up the job's output after job completion
  5056. @param jobContext Context of the job whose output is being written.
  5057. @throws IOException
  5058. @deprecated Use {@link #commitJob(JobContext)} or
  5059. {@link #abortJob(JobContext, int)} instead.]]>
  5060. </doc>
  5061. </method>
  5062. <method name="commitJob"
  5063. abstract="false" native="false" synchronized="false"
  5064. static="false" final="false" visibility="public"
  5065. deprecated="not deprecated">
  5066. <param name="jobContext" type="org.apache.hadoop.mapred.JobContext"/>
  5067. <exception name="IOException" type="java.io.IOException"/>
  5068. <doc>
  5069. <![CDATA[For committing job's output after successful job completion. Note that this
  5070. is invoked for jobs with final runstate as SUCCESSFUL.
  5071. @param jobContext Context of the job whose output is being written.
  5072. @throws IOException]]>
  5073. </doc>
  5074. </method>
  5075. <method name="abortJob"
  5076. abstract="false" native="false" synchronized="false"
  5077. static="false" final="false" visibility="public"
  5078. deprecated="not deprecated">
  5079. <param name="jobContext" type="org.apache.hadoop.mapred.JobContext"/>
  5080. <param name="status" type="int"/>
  5081. <exception name="IOException" type="java.io.IOException"/>
  5082. <doc>
  5083. <![CDATA[For aborting an unsuccessful job's output. Note that this is invoked for
  5084. jobs with final runstate as {@link JobStatus#FAILED} or
  5085. {@link JobStatus#KILLED}
  5086. @param jobContext Context of the job whose output is being written.
  5087. @param status final runstate of the job
  5088. @throws IOException]]>
  5089. </doc>
  5090. </method>
  5091. <method name="setupTask"
  5092. abstract="true" native="false" synchronized="false"
  5093. static="false" final="false" visibility="public"
  5094. deprecated="not deprecated">
  5095. <param name="taskContext" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  5096. <exception name="IOException" type="java.io.IOException"/>
  5097. <doc>
  5098. <![CDATA[Sets up output for the task.
  5099. @param taskContext Context of the task whose output is being written.
  5100. @throws IOException]]>
  5101. </doc>
  5102. </method>
  5103. <method name="needsTaskCommit" return="boolean"
  5104. abstract="true" native="false" synchronized="false"
  5105. static="false" final="false" visibility="public"
  5106. deprecated="not deprecated">
  5107. <param name="taskContext" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  5108. <exception name="IOException" type="java.io.IOException"/>
  5109. <doc>
  5110. <![CDATA[Check whether task needs a commit
  5111. @param taskContext
  5112. @return true/false
  5113. @throws IOException]]>
  5114. </doc>
  5115. </method>
  5116. <method name="commitTask"
  5117. abstract="true" native="false" synchronized="false"
  5118. static="false" final="false" visibility="public"
  5119. deprecated="not deprecated">
  5120. <param name="taskContext" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  5121. <exception name="IOException" type="java.io.IOException"/>
  5122. <doc>
  5123. <![CDATA[To promote the task's temporary output to final output location
  5124. The task's output is moved to the job's output directory.
  5125. @param taskContext Context of the task whose output is being written.
  5126. @throws IOException if commit is not successful]]>
  5127. </doc>
  5128. </method>
  5129. <method name="abortTask"
  5130. abstract="true" native="false" synchronized="false"
  5131. static="false" final="false" visibility="public"
  5132. deprecated="not deprecated">
  5133. <param name="taskContext" type="org.apache.hadoop.mapred.TaskAttemptContext"/>
  5134. <exception name="IOException" type="java.io.IOException"/>
  5135. <doc>
  5136. <![CDATA[Discard the task output
  5137. @param taskContext
  5138. @throws IOException]]>
  5139. </doc>
  5140. </method>
  5141. <method name="setupJob"
  5142. abstract="false" native="false" synchronized="false"
  5143. static="false" final="true" visibility="public"
  5144. deprecated="not deprecated">
  5145. <param name="jobContext" type="org.apache.hadoop.mapreduce.JobContext"/>
  5146. <exception name="IOException" type="java.io.IOException"/>
  5147. <doc>
  5148. <![CDATA[This method implements the new interface by calling the old method. Note
  5149. that the input types are different between the new and old apis and this
  5150. is a bridge between the two.]]>
  5151. </doc>
  5152. </method>
  5153. <method name="cleanupJob"
  5154. abstract="false" native="false" synchronized="false"
  5155. static="false" final="true" visibility="public"
  5156. deprecated="Use {@link #commitJob(org.apache.hadoop.mapreduce.JobContext)}
  5157. or {@link #abortJob(org.apache.hadoop.mapreduce.JobContext, org.apache.hadoop.mapreduce.JobStatus.State)}
  5158. instead.">
  5159. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  5160. <exception name="IOException" type="java.io.IOException"/>
  5161. <doc>
  5162. <![CDATA[This method implements the new interface by calling the old method. Note
  5163. that the input types are different between the new and old apis and this
  5164. is a bridge between the two.
  5165. @deprecated Use {@link #commitJob(org.apache.hadoop.mapreduce.JobContext)}
  5166. or {@link #abortJob(org.apache.hadoop.mapreduce.JobContext, org.apache.hadoop.mapreduce.JobStatus.State)}
  5167. instead.]]>
  5168. </doc>
  5169. </method>
  5170. <method name="commitJob"
  5171. abstract="false" native="false" synchronized="false"
  5172. static="false" final="true" visibility="public"
  5173. deprecated="not deprecated">
  5174. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  5175. <exception name="IOException" type="java.io.IOException"/>
  5176. <doc>
  5177. <![CDATA[This method implements the new interface by calling the old method. Note
  5178. that the input types are different between the new and old apis and this
  5179. is a bridge between the two.]]>
  5180. </doc>
  5181. </method>
  5182. <method name="abortJob"
  5183. abstract="false" native="false" synchronized="false"
  5184. static="false" final="true" visibility="public"
  5185. deprecated="not deprecated">
  5186. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  5187. <param name="runState" type="org.apache.hadoop.mapreduce.JobStatus.State"/>
  5188. <exception name="IOException" type="java.io.IOException"/>
  5189. <doc>
  5190. <![CDATA[This method implements the new interface by calling the old method. Note
  5191. that the input types are different between the new and old apis and this
  5192. is a bridge between the two.]]>
  5193. </doc>
  5194. </method>
  5195. <method name="setupTask"
  5196. abstract="false" native="false" synchronized="false"
  5197. static="false" final="true" visibility="public"
  5198. deprecated="not deprecated">
  5199. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  5200. <exception name="IOException" type="java.io.IOException"/>
  5201. <doc>
  5202. <![CDATA[This method implements the new interface by calling the old method. Note
  5203. that the input types are different between the new and old apis and this
  5204. is a bridge between the two.]]>
  5205. </doc>
  5206. </method>
  5207. <method name="needsTaskCommit" return="boolean"
  5208. abstract="false" native="false" synchronized="false"
  5209. static="false" final="true" visibility="public"
  5210. deprecated="not deprecated">
  5211. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  5212. <exception name="IOException" type="java.io.IOException"/>
  5213. <doc>
  5214. <![CDATA[This method implements the new interface by calling the old method. Note
  5215. that the input types are different between the new and old apis and this
  5216. is a bridge between the two.]]>
  5217. </doc>
  5218. </method>
  5219. <method name="commitTask"
  5220. abstract="false" native="false" synchronized="false"
  5221. static="false" final="true" visibility="public"
  5222. deprecated="not deprecated">
  5223. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  5224. <exception name="IOException" type="java.io.IOException"/>
  5225. <doc>
  5226. <![CDATA[This method implements the new interface by calling the old method. Note
  5227. that the input types are different between the new and old apis and this
  5228. is a bridge between the two.]]>
  5229. </doc>
  5230. </method>
  5231. <method name="abortTask"
  5232. abstract="false" native="false" synchronized="false"
  5233. static="false" final="true" visibility="public"
  5234. deprecated="not deprecated">
  5235. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  5236. <exception name="IOException" type="java.io.IOException"/>
  5237. <doc>
  5238. <![CDATA[This method implements the new interface by calling the old method. Note
  5239. that the input types are different between the new and old apis and this
  5240. is a bridge between the two.]]>
  5241. </doc>
  5242. </method>
  5243. <doc>
  5244. <![CDATA[<code>OutputCommitter</code> describes the commit of task output for a
  5245. Map-Reduce job.
  5246. <p>The Map-Reduce framework relies on the <code>OutputCommitter</code> of
  5247. the job to:</p>
  5248. <ol>
  5249. <li>
  5250. Setup the job during initialization. For example, create the temporary
  5251. output directory for the job during the initialization of the job.
  5252. </li>
  5253. <li>
  5254. Cleanup the job after the job completion. For example, remove the
  5255. temporary output directory after the job completion.
  5256. </li>
  5257. <li>
  5258. Setup the task temporary output.
  5259. </li>
  5260. <li>
  5261. Check whether a task needs a commit. This is to avoid the commit
  5262. procedure if a task does not need commit.
  5263. </li>
  5264. <li>
  5265. Commit of the task output.
  5266. </li>
  5267. <li>
  5268. Discard the task commit.
  5269. </li>
  5270. </ol>
  5271. @see FileOutputCommitter
  5272. @see JobContext
  5273. @see TaskAttemptContext
  5274. @deprecated Use {@link org.apache.hadoop.mapreduce.OutputCommitter} instead.]]>
  5275. </doc>
  5276. </class>
  5277. <!-- end class org.apache.hadoop.mapred.OutputCommitter -->
  5278. <!-- start interface org.apache.hadoop.mapred.OutputFormat -->
  5279. <interface name="OutputFormat" abstract="true"
  5280. static="false" final="false" visibility="public"
  5281. deprecated="Use {@link org.apache.hadoop.mapreduce.OutputFormat} instead.">
  5282. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  5283. abstract="false" native="false" synchronized="false"
  5284. static="false" final="false" visibility="public"
  5285. deprecated="not deprecated">
  5286. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  5287. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  5288. <param name="name" type="java.lang.String"/>
  5289. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  5290. <exception name="IOException" type="java.io.IOException"/>
  5291. <doc>
  5292. <![CDATA[Get the {@link RecordWriter} for the given job.
  5293. @param ignored
  5294. @param job configuration for the job whose output is being written.
  5295. @param name the unique name for this part of the output.
  5296. @param progress mechanism for reporting progress while writing to file.
  5297. @return a {@link RecordWriter} to write the output for the job.
  5298. @throws IOException]]>
  5299. </doc>
  5300. </method>
  5301. <method name="checkOutputSpecs"
  5302. abstract="false" native="false" synchronized="false"
  5303. static="false" final="false" visibility="public"
  5304. deprecated="not deprecated">
  5305. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  5306. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  5307. <exception name="IOException" type="java.io.IOException"/>
  5308. <doc>
  5309. <![CDATA[Check for validity of the output-specification for the job.
  5310. <p>This is to validate the output specification for the job when the
  5311. job is submitted. Typically checks that the output does not already exist,
  5312. throwing an exception when it already exists, so that output is not
  5313. overwritten.</p>
  5314. @param ignored
  5315. @param job job configuration.
  5316. @throws IOException when output should not be attempted]]>
  5317. </doc>
  5318. </method>
  5319. <doc>
  5320. <![CDATA[<code>OutputFormat</code> describes the output-specification for a
  5321. Map-Reduce job.
  5322. <p>The Map-Reduce framework relies on the <code>OutputFormat</code> of the
  5323. job to:</p>
  5324. <ol>
  5325. <li>
  5326. Validate the output-specification of the job. For example, check that the
  5327. output directory doesn't already exist.</li>
  5328. <li>
  5329. Provide the {@link RecordWriter} implementation to be used to write out
  5330. the output files of the job. Output files are stored in a
  5331. {@link FileSystem}.
  5332. </li>
  5333. </ol>
  5334. @see RecordWriter
  5335. @see JobConf
  5336. @deprecated Use {@link org.apache.hadoop.mapreduce.OutputFormat} instead.]]>
  5337. </doc>
  5338. </interface>
  5339. <!-- end interface org.apache.hadoop.mapred.OutputFormat -->
  5340. <!-- start class org.apache.hadoop.mapred.OutputLogFilter -->
  5341. <class name="OutputLogFilter" extends="java.lang.Object"
  5342. abstract="false"
  5343. static="false" final="false" visibility="public"
  5344. deprecated="Use
  5345. {@link org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputLogFilter}
  5346. instead.">
  5347. <implements name="org.apache.hadoop.fs.PathFilter"/>
  5348. <constructor name="OutputLogFilter"
  5349. static="false" final="false" visibility="public"
  5350. deprecated="not deprecated">
  5351. </constructor>
  5352. <method name="accept" return="boolean"
  5353. abstract="false" native="false" synchronized="false"
  5354. static="false" final="false" visibility="public"
  5355. deprecated="not deprecated">
  5356. <param name="path" type="org.apache.hadoop.fs.Path"/>
  5357. </method>
  5358. <doc>
  5359. <![CDATA[This class filters log files from the given directory.
  5360. It doesn't accept paths containing _logs.
  5361. This can be used to list paths of output directory as follows:
  5362. Path[] fileList = FileUtil.stat2Paths(fs.listStatus(outDir,
  5363. new OutputLogFilter()));
  5364. @deprecated Use
  5365. {@link org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputLogFilter}
  5366. instead.]]>
  5367. </doc>
  5368. </class>
  5369. <!-- end class org.apache.hadoop.mapred.OutputLogFilter -->
  5370. <!-- start interface org.apache.hadoop.mapred.Partitioner -->
  5371. <interface name="Partitioner" abstract="true"
  5372. static="false" final="false" visibility="public"
  5373. deprecated="Use {@link org.apache.hadoop.mapreduce.Partitioner} instead.">
  5374. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  5375. <method name="getPartition" return="int"
  5376. abstract="false" native="false" synchronized="false"
  5377. static="false" final="false" visibility="public"
  5378. deprecated="not deprecated">
  5379. <param name="key" type="K2"/>
  5380. <param name="value" type="V2"/>
  5381. <param name="numPartitions" type="int"/>
  5382. <doc>
  5383. <![CDATA[Get the partition number for a given key (hence record) given the total
  5384. number of partitions i.e. number of reduce-tasks for the job.
  5385. <p>Typically a hash function on all or a subset of the key.</p>
  5386. @param key the key to be partitioned.
  5387. @param value the entry value.
  5388. @param numPartitions the total number of partitions.
  5389. @return the partition number for the <code>key</code>.]]>
  5390. </doc>
  5391. </method>
  5392. <doc>
  5393. <![CDATA[Partitions the key space.
  5394. <p><code>Partitioner</code> controls the partitioning of the keys of the
  5395. intermediate map-outputs. The key (or a subset of the key) is used to derive
  5396. the partition, typically by a hash function. The total number of partitions
  5397. is the same as the number of reduce tasks for the job. Hence this controls
  5398. which of the <code>m</code> reduce tasks the intermediate key (and hence the
  5399. record) is sent for reduction.</p>
  5400. @see Reducer
  5401. @deprecated Use {@link org.apache.hadoop.mapreduce.Partitioner} instead.]]>
  5402. </doc>
  5403. </interface>
  5404. <!-- end interface org.apache.hadoop.mapred.Partitioner -->
  5405. <!-- start interface org.apache.hadoop.mapred.RecordReader -->
  5406. <interface name="RecordReader" abstract="true"
  5407. static="false" final="false" visibility="public"
  5408. deprecated="not deprecated">
  5409. <method name="next" return="boolean"
  5410. abstract="false" native="false" synchronized="false"
  5411. static="false" final="false" visibility="public"
  5412. deprecated="not deprecated">
  5413. <param name="key" type="K"/>
  5414. <param name="value" type="V"/>
  5415. <exception name="IOException" type="java.io.IOException"/>
  5416. <doc>
  5417. <![CDATA[Reads the next key/value pair from the input for processing.
  5418. @param key the key to read data into
  5419. @param value the value to read data into
  5420. @return true iff a key/value was read, false if at EOF]]>
  5421. </doc>
  5422. </method>
  5423. <method name="createKey" return="K"
  5424. abstract="false" native="false" synchronized="false"
  5425. static="false" final="false" visibility="public"
  5426. deprecated="not deprecated">
  5427. <doc>
  5428. <![CDATA[Create an object of the appropriate type to be used as a key.
  5429. @return a new key object.]]>
  5430. </doc>
  5431. </method>
  5432. <method name="createValue" return="V"
  5433. abstract="false" native="false" synchronized="false"
  5434. static="false" final="false" visibility="public"
  5435. deprecated="not deprecated">
  5436. <doc>
  5437. <![CDATA[Create an object of the appropriate type to be used as a value.
  5438. @return a new value object.]]>
  5439. </doc>
  5440. </method>
  5441. <method name="getPos" return="long"
  5442. abstract="false" native="false" synchronized="false"
  5443. static="false" final="false" visibility="public"
  5444. deprecated="not deprecated">
  5445. <exception name="IOException" type="java.io.IOException"/>
  5446. <doc>
  5447. <![CDATA[Returns the current position in the input.
  5448. @return the current position in the input.
  5449. @throws IOException]]>
  5450. </doc>
  5451. </method>
  5452. <method name="close"
  5453. abstract="false" native="false" synchronized="false"
  5454. static="false" final="false" visibility="public"
  5455. deprecated="not deprecated">
  5456. <exception name="IOException" type="java.io.IOException"/>
  5457. <doc>
  5458. <![CDATA[Close this {@link RecordReader} to future operations.
  5459. @throws IOException]]>
  5460. </doc>
  5461. </method>
  5462. <method name="getProgress" return="float"
  5463. abstract="false" native="false" synchronized="false"
  5464. static="false" final="false" visibility="public"
  5465. deprecated="not deprecated">
  5466. <exception name="IOException" type="java.io.IOException"/>
  5467. <doc>
  5468. <![CDATA[How much of the input has the {@link RecordReader} consumed, i.e.
  5469. how much has been processed so far?
  5470. @return progress from <code>0.0</code> to <code>1.0</code>.
  5471. @throws IOException]]>
  5472. </doc>
  5473. </method>
  5474. <doc>
  5475. <![CDATA[<code>RecordReader</code> reads &lt;key, value&gt; pairs from an
  5476. {@link InputSplit}.
  5477. <p><code>RecordReader</code>, typically, converts the byte-oriented view of
  5478. the input, provided by the <code>InputSplit</code>, and presents a
  5479. record-oriented view for the {@link Mapper} &amp; {@link Reducer} tasks for
  5480. processing. It thus assumes the responsibility of processing record
  5481. boundaries and presenting the tasks with keys and values.</p>
  5482. @see InputSplit
  5483. @see InputFormat]]>
  5484. </doc>
  5485. </interface>
  5486. <!-- end interface org.apache.hadoop.mapred.RecordReader -->
  5487. <!-- start interface org.apache.hadoop.mapred.RecordWriter -->
  5488. <interface name="RecordWriter" abstract="true"
  5489. static="false" final="false" visibility="public"
  5490. deprecated="not deprecated">
  5491. <method name="write"
  5492. abstract="false" native="false" synchronized="false"
  5493. static="false" final="false" visibility="public"
  5494. deprecated="not deprecated">
  5495. <param name="key" type="K"/>
  5496. <param name="value" type="V"/>
  5497. <exception name="IOException" type="java.io.IOException"/>
  5498. <doc>
  5499. <![CDATA[Writes a key/value pair.
  5500. @param key the key to write.
  5501. @param value the value to write.
  5502. @throws IOException]]>
  5503. </doc>
  5504. </method>
  5505. <method name="close"
  5506. abstract="false" native="false" synchronized="false"
  5507. static="false" final="false" visibility="public"
  5508. deprecated="not deprecated">
  5509. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  5510. <exception name="IOException" type="java.io.IOException"/>
  5511. <doc>
  5512. <![CDATA[Close this <code>RecordWriter</code> to future operations.
  5513. @param reporter facility to report progress.
  5514. @throws IOException]]>
  5515. </doc>
  5516. </method>
  5517. <doc>
  5518. <![CDATA[<code>RecordWriter</code> writes the output &lt;key, value&gt; pairs
  5519. to an output file.
  5520. <p><code>RecordWriter</code> implementations write the job outputs to the
  5521. {@link FileSystem}.</p>
  5522. @see OutputFormat]]>
  5523. </doc>
  5524. </interface>
  5525. <!-- end interface org.apache.hadoop.mapred.RecordWriter -->
  5526. <!-- start interface org.apache.hadoop.mapred.Reducer -->
  5527. <interface name="Reducer" abstract="true"
  5528. static="false" final="false" visibility="public"
  5529. deprecated="Use {@link org.apache.hadoop.mapreduce.Reducer} instead.">
  5530. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  5531. <implements name="org.apache.hadoop.io.Closeable"/>
  5532. <method name="reduce"
  5533. abstract="false" native="false" synchronized="false"
  5534. static="false" final="false" visibility="public"
  5535. deprecated="not deprecated">
  5536. <param name="key" type="K2"/>
  5537. <param name="values" type="java.util.Iterator"/>
  5538. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  5539. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  5540. <exception name="IOException" type="java.io.IOException"/>
  5541. <doc>
  5542. <![CDATA[<i>Reduces</i> values for a given key.
  5543. <p>The framework calls this method for each
  5544. <code>&lt;key, (list of values)&gt;</code> pair in the grouped inputs.
  5545. Output values must be of the same type as input values. Input keys must
  5546. not be altered. The framework will <b>reuse</b> the key and value objects
  5547. that are passed into the reduce, therefore the application should clone
  5548. the objects they want to keep a copy of. In many cases, all values are
  5549. combined into zero or one value.
  5550. </p>
  5551. <p>Output pairs are collected with calls to
  5552. {@link OutputCollector#collect(Object,Object)}.</p>
  5553. <p>Applications can use the {@link Reporter} provided to report progress
  5554. or just indicate that they are alive. In scenarios where the application
  5555. takes a significant amount of time to process individual key/value
  5556. pairs, this is crucial since the framework might assume that the task has
  5557. timed-out and kill that task. The other way of avoiding this is to set
  5558. <a href="{@docRoot}/../mapred-default.html#mapreduce.task.timeout">
  5559. mapreduce.task.timeout</a> to a high-enough value (or even zero for no
  5560. time-outs).</p>
  5561. @param key the key.
  5562. @param values the list of values to reduce.
  5563. @param output to collect keys and combined values.
  5564. @param reporter facility to report progress.]]>
  5565. </doc>
  5566. </method>
  5567. <doc>
  5568. <![CDATA[Reduces a set of intermediate values which share a key to a smaller set of
  5569. values.
  5570. <p>The number of <code>Reducer</code>s for the job is set by the user via
  5571. {@link JobConf#setNumReduceTasks(int)}. <code>Reducer</code> implementations
  5572. can access the {@link JobConf} for the job via the
  5573. {@link JobConfigurable#configure(JobConf)} method and initialize themselves.
  5574. Similarly they can use the {@link Closeable#close()} method for
  5575. de-initialization.</p>
  5576. <p><code>Reducer</code> has 3 primary phases:</p>
  5577. <ol>
  5578. <li>
  5579. <h4 id="Shuffle">Shuffle</h4>
  5580. <p><code>Reducer</code> is input the grouped output of a {@link Mapper}.
  5581. In this phase the framework, for each <code>Reducer</code>, fetches the
  5582. relevant partition of the output of all the <code>Mapper</code>s, via HTTP.
  5583. </p>
  5584. </li>
  5585. <li>
  5586. <h4 id="Sort">Sort</h4>
  5587. <p>The framework groups <code>Reducer</code> inputs by <code>key</code>s
  5588. (since different <code>Mapper</code>s may have output the same key) in this
  5589. stage.</p>
  5590. <p>The shuffle and sort phases occur simultaneously i.e. while outputs are
  5591. being fetched they are merged.</p>
  5592. <h5 id="SecondarySort">SecondarySort</h5>
  5593. <p>If equivalence rules for keys while grouping the intermediates are
  5594. different from those for grouping keys before reduction, then one may
  5595. specify a <code>Comparator</code> via
  5596. {@link JobConf#setOutputValueGroupingComparator(Class)}. Since
  5597. {@link JobConf#setOutputKeyComparatorClass(Class)} can be used to
  5598. control how intermediate keys are grouped, these can be used in conjunction
  5599. to simulate <i>secondary sort on values</i>.</p>
  5600. For example, say that you want to find duplicate web pages and tag them
  5601. all with the url of the "best" known example. You would set up the job
  5602. like:
  5603. <ul>
  5604. <li>Map Input Key: url</li>
  5605. <li>Map Input Value: document</li>
  5606. <li>Map Output Key: document checksum, url pagerank</li>
  5607. <li>Map Output Value: url</li>
  5608. <li>Partitioner: by checksum</li>
  5609. <li>OutputKeyComparator: by checksum and then decreasing pagerank</li>
  5610. <li>OutputValueGroupingComparator: by checksum</li>
  5611. </ul>
  5612. </li>
  5613. <li>
  5614. <h4 id="Reduce">Reduce</h4>
  5615. <p>In this phase the
  5616. {@link #reduce(Object, Iterator, OutputCollector, Reporter)}
  5617. method is called for each <code>&lt;key, (list of values)&gt;</code> pair in
  5618. the grouped inputs.</p>
  5619. <p>The output of the reduce task is typically written to the
  5620. {@link FileSystem} via
  5621. {@link OutputCollector#collect(Object, Object)}.</p>
  5622. </li>
  5623. </ol>
  5624. <p>The output of the <code>Reducer</code> is <b>not re-sorted</b>.</p>
  5625. <p>Example:</p>
  5626. <p><blockquote><pre>
  5627. public class MyReducer&lt;K extends WritableComparable, V extends Writable&gt;
  5628. extends MapReduceBase implements Reducer&lt;K, V, K, V&gt; {
  5629. static enum MyCounters { NUM_RECORDS }
  5630. private String reduceTaskId;
  5631. private int noKeys = 0;
  5632. public void configure(JobConf job) {
  5633. reduceTaskId = job.get(JobContext.TASK_ATTEMPT_ID);
  5634. }
  5635. public void reduce(K key, Iterator&lt;V&gt; values,
  5636. OutputCollector&lt;K, V&gt; output,
  5637. Reporter reporter)
  5638. throws IOException {
  5639. // Process
  5640. int noValues = 0;
  5641. while (values.hasNext()) {
  5642. V value = values.next();
  5643. // Increment the no. of values for this key
  5644. ++noValues;
  5645. // Process the &lt;key, value&gt; pair (assume this takes a while)
  5646. // ...
  5647. // ...
  5648. // Let the framework know that we are alive, and kicking!
  5649. if ((noValues%10) == 0) {
  5650. reporter.progress();
  5651. }
  5652. // Process some more
  5653. // ...
  5654. // ...
  5655. // Output the &lt;key, value&gt;
  5656. output.collect(key, value);
  5657. }
  5658. // Increment the no. of &lt;key, list of values&gt; pairs processed
  5659. ++noKeys;
  5660. // Increment counters
  5661. reporter.incrCounter(MyCounters.NUM_RECORDS, 1);
  5662. // Every 100 keys update application-level status
  5663. if ((noKeys%100) == 0) {
  5664. reporter.setStatus(reduceTaskId + " processed " + noKeys);
  5665. }
  5666. }
  5667. }
  5668. </pre></blockquote></p>
  5669. @see Mapper
  5670. @see Partitioner
  5671. @see Reporter
  5672. @see MapReduceBase
  5673. @deprecated Use {@link org.apache.hadoop.mapreduce.Reducer} instead.]]>
  5674. </doc>
  5675. </interface>
  5676. <!-- end interface org.apache.hadoop.mapred.Reducer -->
  5677. <!-- start interface org.apache.hadoop.mapred.Reporter -->
  5678. <interface name="Reporter" abstract="true"
  5679. static="false" final="false" visibility="public"
  5680. deprecated="not deprecated">
  5681. <implements name="org.apache.hadoop.util.Progressable"/>
  5682. <method name="setStatus"
  5683. abstract="false" native="false" synchronized="false"
  5684. static="false" final="false" visibility="public"
  5685. deprecated="not deprecated">
  5686. <param name="status" type="java.lang.String"/>
  5687. <doc>
  5688. <![CDATA[Set the status description for the task.
  5689. @param status brief description of the current status.]]>
  5690. </doc>
  5691. </method>
  5692. <method name="getCounter" return="org.apache.hadoop.mapred.Counters.Counter"
  5693. abstract="false" native="false" synchronized="false"
  5694. static="false" final="false" visibility="public"
  5695. deprecated="not deprecated">
  5696. <param name="name" type="java.lang.Enum"/>
  5697. <doc>
  5698. <![CDATA[Get the {@link Counter} of the given group with the given name.
  5699. @param name counter name
  5700. @return the <code>Counter</code> of the given group/name.]]>
  5701. </doc>
  5702. </method>
  5703. <method name="getCounter" return="org.apache.hadoop.mapred.Counters.Counter"
  5704. abstract="false" native="false" synchronized="false"
  5705. static="false" final="false" visibility="public"
  5706. deprecated="not deprecated">
  5707. <param name="group" type="java.lang.String"/>
  5708. <param name="name" type="java.lang.String"/>
  5709. <doc>
  5710. <![CDATA[Get the {@link Counter} of the given group with the given name.
  5711. @param group counter group
  5712. @param name counter name
  5713. @return the <code>Counter</code> of the given group/name.]]>
  5714. </doc>
  5715. </method>
  5716. <method name="incrCounter"
  5717. abstract="false" native="false" synchronized="false"
  5718. static="false" final="false" visibility="public"
  5719. deprecated="not deprecated">
  5720. <param name="key" type="java.lang.Enum"/>
  5721. <param name="amount" type="long"/>
  5722. <doc>
  5723. <![CDATA[Increments the counter identified by the key, which can be of
  5724. any {@link Enum} type, by the specified amount.
  5725. @param key key to identify the counter to be incremented. The key can
  5726. be any <code>Enum</code>.
  5727. @param amount A non-negative amount by which the counter is to
  5728. be incremented.]]>
  5729. </doc>
  5730. </method>
  5731. <method name="incrCounter"
  5732. abstract="false" native="false" synchronized="false"
  5733. static="false" final="false" visibility="public"
  5734. deprecated="not deprecated">
  5735. <param name="group" type="java.lang.String"/>
  5736. <param name="counter" type="java.lang.String"/>
  5737. <param name="amount" type="long"/>
  5738. <doc>
  5739. <![CDATA[Increments the counter identified by the group and counter name
  5740. by the specified amount.
  5741. @param group name to identify the group of the counter to be incremented.
  5742. @param counter name to identify the counter within the group.
  5743. @param amount A non-negative amount by which the counter is to
  5744. be incremented.]]>
  5745. </doc>
  5746. </method>
  5747. <method name="getInputSplit" return="org.apache.hadoop.mapred.InputSplit"
  5748. abstract="false" native="false" synchronized="false"
  5749. static="false" final="false" visibility="public"
  5750. deprecated="not deprecated">
  5751. <exception name="UnsupportedOperationException" type="java.lang.UnsupportedOperationException"/>
  5752. <doc>
  5753. <![CDATA[Get the {@link InputSplit} object for a map.
  5754. @return the <code>InputSplit</code> that the map is reading from.
  5755. @throws UnsupportedOperationException if called outside a mapper]]>
  5756. </doc>
  5757. </method>
  5758. <field name="NULL" type="org.apache.hadoop.mapred.Reporter"
  5759. transient="false" volatile="false"
  5760. static="true" final="true" visibility="public"
  5761. deprecated="not deprecated">
  5762. <doc>
  5763. <![CDATA[A constant of Reporter type that does nothing.]]>
  5764. </doc>
  5765. </field>
  5766. <doc>
  5767. <![CDATA[A facility for Map-Reduce applications to report progress and update
  5768. counters, status information etc.
  5769. <p>{@link Mapper} and {@link Reducer} can use the <code>Reporter</code>
  5770. provided to report progress or just indicate that they are alive. In
  5771. scenarios where the application takes a significant amount of time to
  5772. process individual key/value pairs, this is crucial since the framework
  5773. might assume that the task has timed-out and kill that task.</p>
  5774. <p>Applications can also update {@link Counters} via the provided
  5775. <code>Reporter</code>.</p>
  5776. @see Progressable
  5777. @see Counters]]>
  5778. </doc>
  5779. </interface>
  5780. <!-- end interface org.apache.hadoop.mapred.Reporter -->
  5781. <!-- start interface org.apache.hadoop.mapred.RunningJob -->
  5782. <interface name="RunningJob" abstract="true"
  5783. static="false" final="false" visibility="public"
  5784. deprecated="Use {@link org.apache.hadoop.mapreduce.Job} instead">
  5785. <method name="getConfiguration" return="org.apache.hadoop.conf.Configuration"
  5786. abstract="false" native="false" synchronized="false"
  5787. static="false" final="false" visibility="public"
  5788. deprecated="not deprecated">
  5789. <doc>
  5790. <![CDATA[Get the underlying job configuration
  5791. @return the configuration of the job.]]>
  5792. </doc>
  5793. </method>
  5794. <method name="getID" return="org.apache.hadoop.mapred.JobID"
  5795. abstract="false" native="false" synchronized="false"
  5796. static="false" final="false" visibility="public"
  5797. deprecated="not deprecated">
  5798. <doc>
  5799. <![CDATA[Get the job identifier.
  5800. @return the job identifier.]]>
  5801. </doc>
  5802. </method>
  5803. <method name="getJobID" return="java.lang.String"
  5804. abstract="false" native="false" synchronized="false"
  5805. static="false" final="false" visibility="public"
  5806. deprecated="This method is deprecated and will be removed. Applications should
  5807. rather use {@link #getID()}.">
  5808. <doc>
  5809. <![CDATA[@deprecated This method is deprecated and will be removed. Applications should
  5810. rather use {@link #getID()}.]]>
  5811. </doc>
  5812. </method>
  5813. <method name="getJobName" return="java.lang.String"
  5814. abstract="false" native="false" synchronized="false"
  5815. static="false" final="false" visibility="public"
  5816. deprecated="not deprecated">
  5817. <doc>
  5818. <![CDATA[Get the name of the job.
  5819. @return the name of the job.]]>
  5820. </doc>
  5821. </method>
  5822. <method name="getJobFile" return="java.lang.String"
  5823. abstract="false" native="false" synchronized="false"
  5824. static="false" final="false" visibility="public"
  5825. deprecated="not deprecated">
  5826. <doc>
  5827. <![CDATA[Get the path of the submitted job configuration.
  5828. @return the path of the submitted job configuration.]]>
  5829. </doc>
  5830. </method>
  5831. <method name="getTrackingURL" return="java.lang.String"
  5832. abstract="false" native="false" synchronized="false"
  5833. static="false" final="false" visibility="public"
  5834. deprecated="not deprecated">
  5835. <doc>
  5836. <![CDATA[Get the URL where some job progress information will be displayed.
  5837. @return the URL where some job progress information will be displayed.]]>
  5838. </doc>
  5839. </method>
  5840. <method name="mapProgress" return="float"
  5841. abstract="false" native="false" synchronized="false"
  5842. static="false" final="false" visibility="public"
  5843. deprecated="not deprecated">
  5844. <exception name="IOException" type="java.io.IOException"/>
  5845. <doc>
  5846. <![CDATA[Get the <i>progress</i> of the job's map-tasks, as a float between 0.0
  5847. and 1.0. When all map tasks have completed, the function returns 1.0.
  5848. @return the progress of the job's map-tasks.
  5849. @throws IOException]]>
  5850. </doc>
  5851. </method>
  5852. <method name="reduceProgress" return="float"
  5853. abstract="false" native="false" synchronized="false"
  5854. static="false" final="false" visibility="public"
  5855. deprecated="not deprecated">
  5856. <exception name="IOException" type="java.io.IOException"/>
  5857. <doc>
  5858. <![CDATA[Get the <i>progress</i> of the job's reduce-tasks, as a float between 0.0
  5859. and 1.0. When all reduce tasks have completed, the function returns 1.0.
  5860. @return the progress of the job's reduce-tasks.
  5861. @throws IOException]]>
  5862. </doc>
  5863. </method>
  5864. <method name="cleanupProgress" return="float"
  5865. abstract="false" native="false" synchronized="false"
  5866. static="false" final="false" visibility="public"
  5867. deprecated="not deprecated">
  5868. <exception name="IOException" type="java.io.IOException"/>
  5869. <doc>
  5870. <![CDATA[Get the <i>progress</i> of the job's cleanup-tasks, as a float between 0.0
  5871. and 1.0. When all cleanup tasks have completed, the function returns 1.0.
  5872. @return the progress of the job's cleanup-tasks.
  5873. @throws IOException]]>
  5874. </doc>
  5875. </method>
  5876. <method name="setupProgress" return="float"
  5877. abstract="false" native="false" synchronized="false"
  5878. static="false" final="false" visibility="public"
  5879. deprecated="not deprecated">
  5880. <exception name="IOException" type="java.io.IOException"/>
  5881. <doc>
  5882. <![CDATA[Get the <i>progress</i> of the job's setup-tasks, as a float between 0.0
  5883. and 1.0. When all setup tasks have completed, the function returns 1.0.
  5884. @return the progress of the job's setup-tasks.
  5885. @throws IOException]]>
  5886. </doc>
  5887. </method>
  5888. <method name="isComplete" return="boolean"
  5889. abstract="false" native="false" synchronized="false"
  5890. static="false" final="false" visibility="public"
  5891. deprecated="not deprecated">
  5892. <exception name="IOException" type="java.io.IOException"/>
  5893. <doc>
  5894. <![CDATA[Check if the job is finished or not.
  5895. This is a non-blocking call.
  5896. @return <code>true</code> if the job is complete, else <code>false</code>.
  5897. @throws IOException]]>
  5898. </doc>
  5899. </method>
  5900. <method name="isSuccessful" return="boolean"
  5901. abstract="false" native="false" synchronized="false"
  5902. static="false" final="false" visibility="public"
  5903. deprecated="not deprecated">
  5904. <exception name="IOException" type="java.io.IOException"/>
  5905. <doc>
  5906. <![CDATA[Check if the job completed successfully.
  5907. @return <code>true</code> if the job succeeded, else <code>false</code>.
  5908. @throws IOException]]>
  5909. </doc>
  5910. </method>
  5911. <method name="waitForCompletion"
  5912. abstract="false" native="false" synchronized="false"
  5913. static="false" final="false" visibility="public"
  5914. deprecated="not deprecated">
  5915. <exception name="IOException" type="java.io.IOException"/>
  5916. <doc>
  5917. <![CDATA[Blocks until the job is complete.
  5918. @throws IOException]]>
  5919. </doc>
  5920. </method>
  5921. <method name="getJobState" return="int"
  5922. abstract="false" native="false" synchronized="false"
  5923. static="false" final="false" visibility="public"
  5924. deprecated="not deprecated">
  5925. <exception name="IOException" type="java.io.IOException"/>
  5926. <doc>
  5927. <![CDATA[Returns the current state of the Job.
  5928. {@link JobStatus}
  5929. @throws IOException]]>
  5930. </doc>
  5931. </method>
  5932. <method name="killJob"
  5933. abstract="false" native="false" synchronized="false"
  5934. static="false" final="false" visibility="public"
  5935. deprecated="not deprecated">
  5936. <exception name="IOException" type="java.io.IOException"/>
  5937. <doc>
  5938. <![CDATA[Kill the running job. Blocks until all job tasks have been
  5939. killed as well. If the job is no longer running, it simply returns.
  5940. @throws IOException]]>
  5941. </doc>
  5942. </method>
  5943. <method name="setJobPriority"
  5944. abstract="false" native="false" synchronized="false"
  5945. static="false" final="false" visibility="public"
  5946. deprecated="not deprecated">
  5947. <param name="priority" type="java.lang.String"/>
  5948. <exception name="IOException" type="java.io.IOException"/>
  5949. <doc>
  5950. <![CDATA[Set the priority of a running job.
  5951. @param priority the new priority for the job.
  5952. @throws IOException]]>
  5953. </doc>
  5954. </method>
  5955. <method name="getTaskCompletionEvents" return="org.apache.hadoop.mapred.TaskCompletionEvent[]"
  5956. abstract="false" native="false" synchronized="false"
  5957. static="false" final="false" visibility="public"
  5958. deprecated="not deprecated">
  5959. <param name="startFrom" type="int"/>
  5960. <exception name="IOException" type="java.io.IOException"/>
  5961. <doc>
  5962. <![CDATA[Get events indicating completion (success/failure) of component tasks.
  5963. @param startFrom index to start fetching events from
  5964. @return an array of {@link TaskCompletionEvent}s
  5965. @throws IOException]]>
  5966. </doc>
  5967. </method>
  5968. <method name="killTask"
  5969. abstract="false" native="false" synchronized="false"
  5970. static="false" final="false" visibility="public"
  5971. deprecated="not deprecated">
  5972. <param name="taskId" type="org.apache.hadoop.mapred.TaskAttemptID"/>
  5973. <param name="shouldFail" type="boolean"/>
  5974. <exception name="IOException" type="java.io.IOException"/>
  5975. <doc>
  5976. <![CDATA[Kill indicated task attempt.
  5977. @param taskId the id of the task to be terminated.
  5978. @param shouldFail if true the task is failed and added to failed tasks
  5979. list, otherwise it is just killed, w/o affecting
  5980. job failure status.
  5981. @throws IOException]]>
  5982. </doc>
  5983. </method>
  5984. <method name="killTask"
  5985. abstract="false" native="false" synchronized="false"
  5986. static="false" final="false" visibility="public"
  5987. deprecated="Applications should rather use {@link #killTask(TaskAttemptID, boolean)}">
  5988. <param name="taskId" type="java.lang.String"/>
  5989. <param name="shouldFail" type="boolean"/>
  5990. <exception name="IOException" type="java.io.IOException"/>
  5991. <doc>
  5992. <![CDATA[@deprecated Applications should rather use {@link #killTask(TaskAttemptID, boolean)}]]>
  5993. </doc>
  5994. </method>
  5995. <method name="getCounters" return="org.apache.hadoop.mapred.Counters"
  5996. abstract="false" native="false" synchronized="false"
  5997. static="false" final="false" visibility="public"
  5998. deprecated="not deprecated">
  5999. <exception name="IOException" type="java.io.IOException"/>
  6000. <doc>
  6001. <![CDATA[Gets the counters for this job.
  6002. @return the counters for this job.
  6003. @throws IOException]]>
  6004. </doc>
  6005. </method>
  6006. <method name="getTaskDiagnostics" return="java.lang.String[]"
  6007. abstract="false" native="false" synchronized="false"
  6008. static="false" final="false" visibility="public"
  6009. deprecated="not deprecated">
  6010. <param name="taskid" type="org.apache.hadoop.mapred.TaskAttemptID"/>
  6011. <exception name="IOException" type="java.io.IOException"/>
  6012. <doc>
  6013. <![CDATA[Gets the diagnostic messages for a given task attempt.
  6014. @param taskid the id of the task attempt
  6015. @return the list of diagnostic messages for the task
  6016. @throws IOException]]>
  6017. </doc>
  6018. </method>
  6019. <method name="getHistoryUrl" return="java.lang.String"
  6020. abstract="false" native="false" synchronized="false"
  6021. static="false" final="false" visibility="public"
  6022. deprecated="not deprecated">
  6023. <exception name="IOException" type="java.io.IOException"/>
  6024. <doc>
  6025. <![CDATA[Get the url where history file is archived. Returns empty string if
  6026. history file is not available yet.
  6027. @return the url where history file is archived
  6028. @throws IOException]]>
  6029. </doc>
  6030. </method>
  6031. <method name="isRetired" return="boolean"
  6032. abstract="false" native="false" synchronized="false"
  6033. static="false" final="false" visibility="public"
  6034. deprecated="not deprecated">
  6035. <exception name="IOException" type="java.io.IOException"/>
  6036. <doc>
  6037. <![CDATA[Check whether the job has been removed from JobTracker memory and retired.
  6038. On retire, the job history file is copied to a location known by
  6039. {@link #getHistoryUrl()}
  6040. @return <code>true</code> if the job retired, else <code>false</code>.
  6041. @throws IOException]]>
  6042. </doc>
  6043. </method>
  6044. <doc>
  6045. <![CDATA[<code>RunningJob</code> is the user-interface to query for details on a
  6046. running Map-Reduce job.
  6047. <p>Clients can get hold of <code>RunningJob</code> via the {@link JobClient}
  6048. and then query the running-job for details such as name, configuration,
  6049. progress etc.</p>
  6050. @see JobClient
  6051. @deprecated Use {@link org.apache.hadoop.mapreduce.Job} instead]]>
  6052. </doc>
  6053. </interface>
  6054. <!-- end interface org.apache.hadoop.mapred.RunningJob -->
  6055. <!-- start class org.apache.hadoop.mapred.SequenceFileAsBinaryInputFormat -->
  6056. <class name="SequenceFileAsBinaryInputFormat" extends="org.apache.hadoop.mapred.SequenceFileInputFormat"
  6057. abstract="false"
  6058. static="false" final="false" visibility="public"
  6059. deprecated="Use
  6060. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileAsBinaryInputFormat}
  6061. instead">
  6062. <constructor name="SequenceFileAsBinaryInputFormat"
  6063. static="false" final="false" visibility="public"
  6064. deprecated="not deprecated">
  6065. </constructor>
  6066. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  6067. abstract="false" native="false" synchronized="false"
  6068. static="false" final="false" visibility="public"
  6069. deprecated="not deprecated">
  6070. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  6071. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6072. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  6073. <exception name="IOException" type="java.io.IOException"/>
  6074. </method>
  6075. <doc>
  6076. <![CDATA[InputFormat reading keys, values from SequenceFiles in binary (raw)
  6077. format.
  6078. @deprecated Use
  6079. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileAsBinaryInputFormat}
  6080. instead]]>
  6081. </doc>
  6082. </class>
  6083. <!-- end class org.apache.hadoop.mapred.SequenceFileAsBinaryInputFormat -->
  6084. <!-- start class org.apache.hadoop.mapred.SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader -->
  6085. <class name="SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader" extends="java.lang.Object"
  6086. abstract="false"
  6087. static="true" final="false" visibility="public"
  6088. deprecated="not deprecated">
  6089. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  6090. <constructor name="SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader" type="org.apache.hadoop.conf.Configuration, org.apache.hadoop.mapred.FileSplit"
  6091. static="false" final="false" visibility="public"
  6092. deprecated="not deprecated">
  6093. <exception name="IOException" type="java.io.IOException"/>
  6094. </constructor>
  6095. <method name="createKey" return="org.apache.hadoop.io.BytesWritable"
  6096. abstract="false" native="false" synchronized="false"
  6097. static="false" final="false" visibility="public"
  6098. deprecated="not deprecated">
  6099. </method>
  6100. <method name="createValue" return="org.apache.hadoop.io.BytesWritable"
  6101. abstract="false" native="false" synchronized="false"
  6102. static="false" final="false" visibility="public"
  6103. deprecated="not deprecated">
  6104. </method>
  6105. <method name="getKeyClassName" return="java.lang.String"
  6106. abstract="false" native="false" synchronized="false"
  6107. static="false" final="false" visibility="public"
  6108. deprecated="not deprecated">
  6109. <doc>
  6110. <![CDATA[Retrieve the name of the key class for this SequenceFile.
  6111. @see org.apache.hadoop.io.SequenceFile.Reader#getKeyClassName]]>
  6112. </doc>
  6113. </method>
  6114. <method name="getValueClassName" return="java.lang.String"
  6115. abstract="false" native="false" synchronized="false"
  6116. static="false" final="false" visibility="public"
  6117. deprecated="not deprecated">
  6118. <doc>
  6119. <![CDATA[Retrieve the name of the value class for this SequenceFile.
  6120. @see org.apache.hadoop.io.SequenceFile.Reader#getValueClassName]]>
  6121. </doc>
  6122. </method>
  6123. <method name="next" return="boolean"
  6124. abstract="false" native="false" synchronized="true"
  6125. static="false" final="false" visibility="public"
  6126. deprecated="not deprecated">
  6127. <param name="key" type="org.apache.hadoop.io.BytesWritable"/>
  6128. <param name="val" type="org.apache.hadoop.io.BytesWritable"/>
  6129. <exception name="IOException" type="java.io.IOException"/>
  6130. <doc>
  6131. <![CDATA[Read raw bytes from a SequenceFile.]]>
  6132. </doc>
  6133. </method>
  6134. <method name="getPos" return="long"
  6135. abstract="false" native="false" synchronized="false"
  6136. static="false" final="false" visibility="public"
  6137. deprecated="not deprecated">
  6138. <exception name="IOException" type="java.io.IOException"/>
  6139. </method>
  6140. <method name="close"
  6141. abstract="false" native="false" synchronized="false"
  6142. static="false" final="false" visibility="public"
  6143. deprecated="not deprecated">
  6144. <exception name="IOException" type="java.io.IOException"/>
  6145. </method>
  6146. <method name="getProgress" return="float"
  6147. abstract="false" native="false" synchronized="false"
  6148. static="false" final="false" visibility="public"
  6149. deprecated="not deprecated">
  6150. <exception name="IOException" type="java.io.IOException"/>
  6151. <doc>
  6152. <![CDATA[Return the progress within the input split
  6153. @return 0.0 to 1.0 of the input byte range]]>
  6154. </doc>
  6155. </method>
  6156. <doc>
  6157. <![CDATA[Read records from a SequenceFile as binary (raw) bytes.]]>
  6158. </doc>
  6159. </class>
  6160. <!-- end class org.apache.hadoop.mapred.SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader -->
  6161. <!-- start class org.apache.hadoop.mapred.SequenceFileAsBinaryOutputFormat -->
  6162. <class name="SequenceFileAsBinaryOutputFormat" extends="org.apache.hadoop.mapred.SequenceFileOutputFormat"
  6163. abstract="false"
  6164. static="false" final="false" visibility="public"
  6165. deprecated="Use
  6166. {@link org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat}
  6167. instead">
  6168. <constructor name="SequenceFileAsBinaryOutputFormat"
  6169. static="false" final="false" visibility="public"
  6170. deprecated="not deprecated">
  6171. </constructor>
  6172. <method name="setSequenceFileOutputKeyClass"
  6173. abstract="false" native="false" synchronized="false"
  6174. static="true" final="false" visibility="public"
  6175. deprecated="not deprecated">
  6176. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6177. <param name="theClass" type="java.lang.Class"/>
  6178. <doc>
  6179. <![CDATA[Set the key class for the {@link SequenceFile}
  6180. <p>This allows the user to specify the key class to be different
  6181. from the actual class ({@link BytesWritable}) used for writing </p>
  6182. @param conf the {@link JobConf} to modify
  6183. @param theClass the SequenceFile output key class.]]>
  6184. </doc>
  6185. </method>
  6186. <method name="setSequenceFileOutputValueClass"
  6187. abstract="false" native="false" synchronized="false"
  6188. static="true" final="false" visibility="public"
  6189. deprecated="not deprecated">
  6190. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6191. <param name="theClass" type="java.lang.Class"/>
  6192. <doc>
  6193. <![CDATA[Set the value class for the {@link SequenceFile}
  6194. <p>This allows the user to specify the value class to be different
  6195. from the actual class ({@link BytesWritable}) used for writing </p>
  6196. @param conf the {@link JobConf} to modify
  6197. @param theClass the SequenceFile output value class.]]>
  6198. </doc>
  6199. </method>
  6200. <method name="getSequenceFileOutputKeyClass" return="java.lang.Class"
  6201. abstract="false" native="false" synchronized="false"
  6202. static="true" final="false" visibility="public"
  6203. deprecated="not deprecated">
  6204. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6205. <doc>
  6206. <![CDATA[Get the key class for the {@link SequenceFile}
  6207. @return the key class of the {@link SequenceFile}]]>
  6208. </doc>
  6209. </method>
  6210. <method name="getSequenceFileOutputValueClass" return="java.lang.Class"
  6211. abstract="false" native="false" synchronized="false"
  6212. static="true" final="false" visibility="public"
  6213. deprecated="not deprecated">
  6214. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6215. <doc>
  6216. <![CDATA[Get the value class for the {@link SequenceFile}
  6217. @return the value class of the {@link SequenceFile}]]>
  6218. </doc>
  6219. </method>
  6220. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  6221. abstract="false" native="false" synchronized="false"
  6222. static="false" final="false" visibility="public"
  6223. deprecated="not deprecated">
  6224. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  6225. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6226. <param name="name" type="java.lang.String"/>
  6227. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  6228. <exception name="IOException" type="java.io.IOException"/>
  6229. </method>
  6230. <method name="checkOutputSpecs"
  6231. abstract="false" native="false" synchronized="false"
  6232. static="false" final="false" visibility="public"
  6233. deprecated="not deprecated">
  6234. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  6235. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6236. <exception name="IOException" type="java.io.IOException"/>
  6237. </method>
  6238. <doc>
  6239. <![CDATA[An {@link OutputFormat} that writes keys, values to
  6240. {@link SequenceFile}s in binary (raw) format.
  6241. @deprecated Use
  6242. {@link org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat}
  6243. instead]]>
  6244. </doc>
  6245. </class>
  6246. <!-- end class org.apache.hadoop.mapred.SequenceFileAsBinaryOutputFormat -->
  6247. <!-- start class org.apache.hadoop.mapred.SequenceFileAsBinaryOutputFormat.WritableValueBytes -->
  6248. <class name="SequenceFileAsBinaryOutputFormat.WritableValueBytes" extends="org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat.WritableValueBytes"
  6249. abstract="false"
  6250. static="true" final="false" visibility="protected"
  6251. deprecated="not deprecated">
  6252. <constructor name="SequenceFileAsBinaryOutputFormat.WritableValueBytes"
  6253. static="false" final="false" visibility="protected"
  6254. deprecated="not deprecated">
  6255. </constructor>
  6256. <doc>
  6257. <![CDATA[Inner class used for appendRaw]]>
  6258. </doc>
  6259. </class>
  6260. <!-- end class org.apache.hadoop.mapred.SequenceFileAsBinaryOutputFormat.WritableValueBytes -->
  6261. <!-- start class org.apache.hadoop.mapred.SequenceFileAsTextInputFormat -->
  6262. <class name="SequenceFileAsTextInputFormat" extends="org.apache.hadoop.mapred.SequenceFileInputFormat"
  6263. abstract="false"
  6264. static="false" final="false" visibility="public"
  6265. deprecated="Use
  6266. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextInputFormat}
  6267. instead">
  6268. <constructor name="SequenceFileAsTextInputFormat"
  6269. static="false" final="false" visibility="public"
  6270. deprecated="not deprecated">
  6271. </constructor>
  6272. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  6273. abstract="false" native="false" synchronized="false"
  6274. static="false" final="false" visibility="public"
  6275. deprecated="not deprecated">
  6276. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  6277. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6278. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  6279. <exception name="IOException" type="java.io.IOException"/>
  6280. </method>
  6281. <doc>
  6282. <![CDATA[This class is similar to SequenceFileInputFormat,
  6283. except it generates SequenceFileAsTextRecordReader
  6284. which converts the input keys and values to their
  6285. String forms by calling toString() method.
  6286. @deprecated Use
  6287. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextInputFormat}
  6288. instead]]>
  6289. </doc>
  6290. </class>
  6291. <!-- end class org.apache.hadoop.mapred.SequenceFileAsTextInputFormat -->
  6292. <!-- start class org.apache.hadoop.mapred.SequenceFileAsTextRecordReader -->
  6293. <class name="SequenceFileAsTextRecordReader" extends="java.lang.Object"
  6294. abstract="false"
  6295. static="false" final="false" visibility="public"
  6296. deprecated="Use
  6297. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextRecordReader}
  6298. instead">
  6299. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  6300. <constructor name="SequenceFileAsTextRecordReader" type="org.apache.hadoop.conf.Configuration, org.apache.hadoop.mapred.FileSplit"
  6301. static="false" final="false" visibility="public"
  6302. deprecated="not deprecated">
  6303. <exception name="IOException" type="java.io.IOException"/>
  6304. </constructor>
  6305. <method name="createKey" return="org.apache.hadoop.io.Text"
  6306. abstract="false" native="false" synchronized="false"
  6307. static="false" final="false" visibility="public"
  6308. deprecated="not deprecated">
  6309. </method>
  6310. <method name="createValue" return="org.apache.hadoop.io.Text"
  6311. abstract="false" native="false" synchronized="false"
  6312. static="false" final="false" visibility="public"
  6313. deprecated="not deprecated">
  6314. </method>
  6315. <method name="next" return="boolean"
  6316. abstract="false" native="false" synchronized="true"
  6317. static="false" final="false" visibility="public"
  6318. deprecated="not deprecated">
  6319. <param name="key" type="org.apache.hadoop.io.Text"/>
  6320. <param name="value" type="org.apache.hadoop.io.Text"/>
  6321. <exception name="IOException" type="java.io.IOException"/>
  6322. <doc>
  6323. <![CDATA[Read key/value pair in a line.]]>
  6324. </doc>
  6325. </method>
  6326. <method name="getProgress" return="float"
  6327. abstract="false" native="false" synchronized="false"
  6328. static="false" final="false" visibility="public"
  6329. deprecated="not deprecated">
  6330. <exception name="IOException" type="java.io.IOException"/>
  6331. </method>
  6332. <method name="getPos" return="long"
  6333. abstract="false" native="false" synchronized="true"
  6334. static="false" final="false" visibility="public"
  6335. deprecated="not deprecated">
  6336. <exception name="IOException" type="java.io.IOException"/>
  6337. </method>
  6338. <method name="close"
  6339. abstract="false" native="false" synchronized="true"
  6340. static="false" final="false" visibility="public"
  6341. deprecated="not deprecated">
  6342. <exception name="IOException" type="java.io.IOException"/>
  6343. </method>
  6344. <doc>
  6345. <![CDATA[This class converts the input keys and values to their String forms by calling toString()
  6346. method. This class is to SequenceFileAsTextInputFormat what LineRecordReader
  6347. is to TextInputFormat.
  6348. @deprecated Use
  6349. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextRecordReader}
  6350. instead]]>
  6351. </doc>
  6352. </class>
  6353. <!-- end class org.apache.hadoop.mapred.SequenceFileAsTextRecordReader -->
  6354. <!-- start class org.apache.hadoop.mapred.SequenceFileInputFilter -->
  6355. <class name="SequenceFileInputFilter" extends="org.apache.hadoop.mapred.SequenceFileInputFormat"
  6356. abstract="false"
  6357. static="false" final="false" visibility="public"
  6358. deprecated="Use
  6359. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter}
  6360. instead">
  6361. <constructor name="SequenceFileInputFilter"
  6362. static="false" final="false" visibility="public"
  6363. deprecated="not deprecated">
  6364. </constructor>
  6365. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  6366. abstract="false" native="false" synchronized="false"
  6367. static="false" final="false" visibility="public"
  6368. deprecated="not deprecated">
  6369. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  6370. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6371. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  6372. <exception name="IOException" type="java.io.IOException"/>
  6373. <doc>
  6374. <![CDATA[Create a record reader for the given split
  6375. @param split file split
  6376. @param job job configuration
  6377. @param reporter reporter who sends report to task tracker
  6378. @return RecordReader]]>
  6379. </doc>
  6380. </method>
  6381. <method name="setFilterClass"
  6382. abstract="false" native="false" synchronized="false"
  6383. static="true" final="false" visibility="public"
  6384. deprecated="not deprecated">
  6385. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6386. <param name="filterClass" type="java.lang.Class"/>
  6387. <doc>
  6388. <![CDATA[set the filter class
  6389. @param conf application configuration
  6390. @param filterClass filter class]]>
  6391. </doc>
  6392. </method>
  6393. <doc>
  6394. <![CDATA[A class that allows a map/red job to work on a sample of sequence files.
  6395. The sample is decided by the filter class set by the job.
  6396. @deprecated Use
  6397. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter}
  6398. instead]]>
  6399. </doc>
  6400. </class>
  6401. <!-- end class org.apache.hadoop.mapred.SequenceFileInputFilter -->
  6402. <!-- start interface org.apache.hadoop.mapred.SequenceFileInputFilter.Filter -->
  6403. <interface name="SequenceFileInputFilter.Filter" abstract="true"
  6404. static="true" final="false" visibility="public"
  6405. deprecated="not deprecated">
  6406. <implements name="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.Filter"/>
  6407. <doc>
  6408. <![CDATA[filter interface]]>
  6409. </doc>
  6410. </interface>
  6411. <!-- end interface org.apache.hadoop.mapred.SequenceFileInputFilter.Filter -->
  6412. <!-- start class org.apache.hadoop.mapred.SequenceFileInputFilter.FilterBase -->
  6413. <class name="SequenceFileInputFilter.FilterBase" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.FilterBase"
  6414. abstract="true"
  6415. static="true" final="false" visibility="public"
  6416. deprecated="not deprecated">
  6417. <implements name="org.apache.hadoop.mapred.SequenceFileInputFilter.Filter"/>
  6418. <constructor name="SequenceFileInputFilter.FilterBase"
  6419. static="false" final="false" visibility="public"
  6420. deprecated="not deprecated">
  6421. </constructor>
  6422. <doc>
  6423. <![CDATA[base class for Filters]]>
  6424. </doc>
  6425. </class>
  6426. <!-- end class org.apache.hadoop.mapred.SequenceFileInputFilter.FilterBase -->
  6427. <!-- start class org.apache.hadoop.mapred.SequenceFileInputFilter.MD5Filter -->
  6428. <class name="SequenceFileInputFilter.MD5Filter" extends="org.apache.hadoop.mapred.SequenceFileInputFilter.FilterBase"
  6429. abstract="false"
  6430. static="true" final="false" visibility="public"
  6431. deprecated="not deprecated">
  6432. <constructor name="SequenceFileInputFilter.MD5Filter"
  6433. static="false" final="false" visibility="public"
  6434. deprecated="not deprecated">
  6435. </constructor>
  6436. <method name="setFrequency"
  6437. abstract="false" native="false" synchronized="false"
  6438. static="true" final="false" visibility="public"
  6439. deprecated="not deprecated">
  6440. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6441. <param name="frequency" type="int"/>
  6442. <doc>
  6443. <![CDATA[set the filtering frequency in configuration
  6444. @param conf configuration
  6445. @param frequency filtering frequency]]>
  6446. </doc>
  6447. </method>
  6448. <method name="setConf"
  6449. abstract="false" native="false" synchronized="false"
  6450. static="false" final="false" visibility="public"
  6451. deprecated="not deprecated">
  6452. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6453. <doc>
  6454. <![CDATA[configure the filter according to configuration
  6455. @param conf configuration]]>
  6456. </doc>
  6457. </method>
  6458. <method name="accept" return="boolean"
  6459. abstract="false" native="false" synchronized="false"
  6460. static="false" final="false" visibility="public"
  6461. deprecated="not deprecated">
  6462. <param name="key" type="java.lang.Object"/>
  6463. <doc>
  6464. <![CDATA[Filtering method
  6465. If MD5(key) % frequency==0, return true; otherwise return false
  6466. @see org.apache.hadoop.mapred.SequenceFileInputFilter.Filter#accept(Object)]]>
  6467. </doc>
  6468. </method>
  6469. <field name="MD5_LEN" type="int"
  6470. transient="false" volatile="false"
  6471. static="true" final="true" visibility="public"
  6472. deprecated="not deprecated">
  6473. </field>
  6474. <doc>
  6475. <![CDATA[This class returns a set of records by examining the MD5 digest of its
  6476. key against a filtering frequency <i>f</i>. The filtering criterion is
  6477. MD5(key) % f == 0.]]>
  6478. </doc>
  6479. </class>
  6480. <!-- end class org.apache.hadoop.mapred.SequenceFileInputFilter.MD5Filter -->
  6481. <!-- start class org.apache.hadoop.mapred.SequenceFileInputFilter.PercentFilter -->
  6482. <class name="SequenceFileInputFilter.PercentFilter" extends="org.apache.hadoop.mapred.SequenceFileInputFilter.FilterBase"
  6483. abstract="false"
  6484. static="true" final="false" visibility="public"
  6485. deprecated="not deprecated">
  6486. <constructor name="SequenceFileInputFilter.PercentFilter"
  6487. static="false" final="false" visibility="public"
  6488. deprecated="not deprecated">
  6489. </constructor>
  6490. <method name="setFrequency"
  6491. abstract="false" native="false" synchronized="false"
  6492. static="true" final="false" visibility="public"
  6493. deprecated="not deprecated">
  6494. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6495. <param name="frequency" type="int"/>
  6496. <doc>
  6497. <![CDATA[set the frequency and stores it in conf
  6498. @param conf configuration
  6499. @param frequency filtering frequency]]>
  6500. </doc>
  6501. </method>
  6502. <method name="setConf"
  6503. abstract="false" native="false" synchronized="false"
  6504. static="false" final="false" visibility="public"
  6505. deprecated="not deprecated">
  6506. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6507. <doc>
  6508. <![CDATA[configure the filter by checking the configuration
  6509. @param conf configuration]]>
  6510. </doc>
  6511. </method>
  6512. <method name="accept" return="boolean"
  6513. abstract="false" native="false" synchronized="false"
  6514. static="false" final="false" visibility="public"
  6515. deprecated="not deprecated">
  6516. <param name="key" type="java.lang.Object"/>
  6517. <doc>
  6518. <![CDATA[Filtering method
  6519. If record# % frequency==0, return true; otherwise return false
  6520. @see org.apache.hadoop.mapred.SequenceFileInputFilter.Filter#accept(Object)]]>
  6521. </doc>
  6522. </method>
  6523. <doc>
  6524. <![CDATA[This class returns a percentage of records.
  6525. The percentage is determined by a filtering frequency <i>f</i> using
  6526. the criteria record# % f == 0.
  6527. For example, if the frequency is 10, one out of 10 records is returned.]]>
  6528. </doc>
  6529. </class>
  6530. <!-- end class org.apache.hadoop.mapred.SequenceFileInputFilter.PercentFilter -->
  6531. <!-- start class org.apache.hadoop.mapred.SequenceFileInputFilter.RegexFilter -->
  6532. <class name="SequenceFileInputFilter.RegexFilter" extends="org.apache.hadoop.mapred.SequenceFileInputFilter.FilterBase"
  6533. abstract="false"
  6534. static="true" final="false" visibility="public"
  6535. deprecated="not deprecated">
  6536. <constructor name="SequenceFileInputFilter.RegexFilter"
  6537. static="false" final="false" visibility="public"
  6538. deprecated="not deprecated">
  6539. </constructor>
  6540. <method name="setPattern"
  6541. abstract="false" native="false" synchronized="false"
  6542. static="true" final="false" visibility="public"
  6543. deprecated="not deprecated">
  6544. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6545. <param name="regex" type="java.lang.String"/>
  6546. <exception name="PatternSyntaxException" type="java.util.regex.PatternSyntaxException"/>
  6547. </method>
  6548. <method name="setConf"
  6549. abstract="false" native="false" synchronized="false"
  6550. static="false" final="false" visibility="public"
  6551. deprecated="not deprecated">
  6552. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6553. <doc>
  6554. <![CDATA[configure the Filter by checking the configuration]]>
  6555. </doc>
  6556. </method>
  6557. <method name="accept" return="boolean"
  6558. abstract="false" native="false" synchronized="false"
  6559. static="false" final="false" visibility="public"
  6560. deprecated="not deprecated">
  6561. <param name="key" type="java.lang.Object"/>
  6562. <doc>
  6563. <![CDATA[Filtering method
  6564. If key matches the regex, return true; otherwise return false
  6565. @see org.apache.hadoop.mapred.SequenceFileInputFilter.Filter#accept(Object)]]>
  6566. </doc>
  6567. </method>
  6568. <doc>
  6569. <![CDATA[Records filter by matching key to regex]]>
  6570. </doc>
  6571. </class>
  6572. <!-- end class org.apache.hadoop.mapred.SequenceFileInputFilter.RegexFilter -->
  6573. <!-- start class org.apache.hadoop.mapred.SequenceFileInputFormat -->
  6574. <class name="SequenceFileInputFormat" extends="org.apache.hadoop.mapred.FileInputFormat"
  6575. abstract="false"
  6576. static="false" final="false" visibility="public"
  6577. deprecated="Use
  6578. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat}
  6579. instead.">
  6580. <constructor name="SequenceFileInputFormat"
  6581. static="false" final="false" visibility="public"
  6582. deprecated="not deprecated">
  6583. </constructor>
  6584. <method name="listStatus" return="org.apache.hadoop.fs.FileStatus[]"
  6585. abstract="false" native="false" synchronized="false"
  6586. static="false" final="false" visibility="protected"
  6587. deprecated="not deprecated">
  6588. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6589. <exception name="IOException" type="java.io.IOException"/>
  6590. </method>
  6591. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  6592. abstract="false" native="false" synchronized="false"
  6593. static="false" final="false" visibility="public"
  6594. deprecated="not deprecated">
  6595. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  6596. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6597. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  6598. <exception name="IOException" type="java.io.IOException"/>
  6599. </method>
  6600. <doc>
  6601. <![CDATA[An {@link InputFormat} for {@link SequenceFile}s.
  6602. @deprecated Use
  6603. {@link org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat}
  6604. instead.]]>
  6605. </doc>
  6606. </class>
  6607. <!-- end class org.apache.hadoop.mapred.SequenceFileInputFormat -->
  6608. <!-- start class org.apache.hadoop.mapred.SequenceFileOutputFormat -->
  6609. <class name="SequenceFileOutputFormat" extends="org.apache.hadoop.mapred.FileOutputFormat"
  6610. abstract="false"
  6611. static="false" final="false" visibility="public"
  6612. deprecated="Use
  6613. {@link org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat}
  6614. instead.">
  6615. <constructor name="SequenceFileOutputFormat"
  6616. static="false" final="false" visibility="public"
  6617. deprecated="not deprecated">
  6618. </constructor>
  6619. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  6620. abstract="false" native="false" synchronized="false"
  6621. static="false" final="false" visibility="public"
  6622. deprecated="not deprecated">
  6623. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  6624. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  6625. <param name="name" type="java.lang.String"/>
  6626. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  6627. <exception name="IOException" type="java.io.IOException"/>
  6628. </method>
  6629. <method name="getReaders" return="org.apache.hadoop.io.SequenceFile.Reader[]"
  6630. abstract="false" native="false" synchronized="false"
  6631. static="true" final="false" visibility="public"
  6632. deprecated="not deprecated">
  6633. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6634. <param name="dir" type="org.apache.hadoop.fs.Path"/>
  6635. <exception name="IOException" type="java.io.IOException"/>
  6636. <doc>
  6637. <![CDATA[Open the output generated by this format.]]>
  6638. </doc>
  6639. </method>
  6640. <method name="getOutputCompressionType" return="org.apache.hadoop.io.SequenceFile.CompressionType"
  6641. abstract="false" native="false" synchronized="false"
  6642. static="true" final="false" visibility="public"
  6643. deprecated="not deprecated">
  6644. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6645. <doc>
  6646. <![CDATA[Get the {@link CompressionType} for the output {@link SequenceFile}.
  6647. @param conf the {@link JobConf}
  6648. @return the {@link CompressionType} for the output {@link SequenceFile},
  6649. defaulting to {@link CompressionType#RECORD}]]>
  6650. </doc>
  6651. </method>
  6652. <method name="setOutputCompressionType"
  6653. abstract="false" native="false" synchronized="false"
  6654. static="true" final="false" visibility="public"
  6655. deprecated="not deprecated">
  6656. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6657. <param name="style" type="org.apache.hadoop.io.SequenceFile.CompressionType"/>
  6658. <doc>
  6659. <![CDATA[Set the {@link CompressionType} for the output {@link SequenceFile}.
  6660. @param conf the {@link JobConf} to modify
  6661. @param style the {@link CompressionType} for the output
  6662. {@link SequenceFile}]]>
  6663. </doc>
  6664. </method>
  6665. <doc>
  6666. <![CDATA[An {@link OutputFormat} that writes {@link SequenceFile}s.
  6667. @deprecated Use
  6668. {@link org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat}
  6669. instead.]]>
  6670. </doc>
  6671. </class>
  6672. <!-- end class org.apache.hadoop.mapred.SequenceFileOutputFormat -->
  6673. <!-- start class org.apache.hadoop.mapred.SequenceFileRecordReader -->
  6674. <class name="SequenceFileRecordReader" extends="java.lang.Object"
  6675. abstract="false"
  6676. static="false" final="false" visibility="public"
  6677. deprecated="not deprecated">
  6678. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  6679. <constructor name="SequenceFileRecordReader" type="org.apache.hadoop.conf.Configuration, org.apache.hadoop.mapred.FileSplit"
  6680. static="false" final="false" visibility="public"
  6681. deprecated="not deprecated">
  6682. <exception name="IOException" type="java.io.IOException"/>
  6683. </constructor>
  6684. <method name="getKeyClass" return="java.lang.Class"
  6685. abstract="false" native="false" synchronized="false"
  6686. static="false" final="false" visibility="public"
  6687. deprecated="not deprecated">
  6688. <doc>
  6689. <![CDATA[The class of key that must be passed to {@link
  6690. #next(Object, Object)}.]]>
  6691. </doc>
  6692. </method>
  6693. <method name="getValueClass" return="java.lang.Class"
  6694. abstract="false" native="false" synchronized="false"
  6695. static="false" final="false" visibility="public"
  6696. deprecated="not deprecated">
  6697. <doc>
  6698. <![CDATA[The class of value that must be passed to {@link
  6699. #next(Object, Object)}.]]>
  6700. </doc>
  6701. </method>
  6702. <method name="createKey" return="K"
  6703. abstract="false" native="false" synchronized="false"
  6704. static="false" final="false" visibility="public"
  6705. deprecated="not deprecated">
  6706. </method>
  6707. <method name="createValue" return="V"
  6708. abstract="false" native="false" synchronized="false"
  6709. static="false" final="false" visibility="public"
  6710. deprecated="not deprecated">
  6711. </method>
  6712. <method name="next" return="boolean"
  6713. abstract="false" native="false" synchronized="true"
  6714. static="false" final="false" visibility="public"
  6715. deprecated="not deprecated">
  6716. <param name="key" type="K"/>
  6717. <param name="value" type="V"/>
  6718. <exception name="IOException" type="java.io.IOException"/>
  6719. </method>
  6720. <method name="next" return="boolean"
  6721. abstract="false" native="false" synchronized="true"
  6722. static="false" final="false" visibility="protected"
  6723. deprecated="not deprecated">
  6724. <param name="key" type="K"/>
  6725. <exception name="IOException" type="java.io.IOException"/>
  6726. </method>
  6727. <method name="getCurrentValue"
  6728. abstract="false" native="false" synchronized="true"
  6729. static="false" final="false" visibility="protected"
  6730. deprecated="not deprecated">
  6731. <param name="value" type="V"/>
  6732. <exception name="IOException" type="java.io.IOException"/>
  6733. </method>
  6734. <method name="getProgress" return="float"
  6735. abstract="false" native="false" synchronized="false"
  6736. static="false" final="false" visibility="public"
  6737. deprecated="not deprecated">
  6738. <exception name="IOException" type="java.io.IOException"/>
  6739. <doc>
  6740. <![CDATA[Return the progress within the input split
  6741. @return 0.0 to 1.0 of the input byte range]]>
  6742. </doc>
  6743. </method>
  6744. <method name="getPos" return="long"
  6745. abstract="false" native="false" synchronized="true"
  6746. static="false" final="false" visibility="public"
  6747. deprecated="not deprecated">
  6748. <exception name="IOException" type="java.io.IOException"/>
  6749. </method>
  6750. <method name="seek"
  6751. abstract="false" native="false" synchronized="true"
  6752. static="false" final="false" visibility="protected"
  6753. deprecated="not deprecated">
  6754. <param name="pos" type="long"/>
  6755. <exception name="IOException" type="java.io.IOException"/>
  6756. </method>
  6757. <method name="close"
  6758. abstract="false" native="false" synchronized="true"
  6759. static="false" final="false" visibility="public"
  6760. deprecated="not deprecated">
  6761. <exception name="IOException" type="java.io.IOException"/>
  6762. </method>
  6763. <field name="conf" type="org.apache.hadoop.conf.Configuration"
  6764. transient="false" volatile="false"
  6765. static="false" final="false" visibility="protected"
  6766. deprecated="not deprecated">
  6767. </field>
  6768. <doc>
  6769. <![CDATA[A {@link RecordReader} for {@link SequenceFile}s.]]>
  6770. </doc>
  6771. </class>
  6772. <!-- end class org.apache.hadoop.mapred.SequenceFileRecordReader -->
  6773. <!-- start class org.apache.hadoop.mapred.SkipBadRecords -->
  6774. <class name="SkipBadRecords" extends="java.lang.Object"
  6775. abstract="false"
  6776. static="false" final="false" visibility="public"
  6777. deprecated="not deprecated">
  6778. <constructor name="SkipBadRecords"
  6779. static="false" final="false" visibility="public"
  6780. deprecated="not deprecated">
  6781. </constructor>
  6782. <method name="getAttemptsToStartSkipping" return="int"
  6783. abstract="false" native="false" synchronized="false"
  6784. static="true" final="false" visibility="public"
  6785. deprecated="not deprecated">
  6786. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6787. <doc>
  6788. <![CDATA[Get the number of Task attempts AFTER which skip mode
  6789. will be kicked off. When skip mode is kicked off, the
  6790. task reports the range of records which it will process
  6791. next to the TaskTracker, so that on failure the TaskTracker knows which
  6792. records are possibly bad. On further executions,
  6793. those are skipped.
  6794. Default value is 2.
  6795. @param conf the configuration
  6796. @return attemptsToStartSkipping no of task attempts]]>
  6797. </doc>
  6798. </method>
  6799. <method name="setAttemptsToStartSkipping"
  6800. abstract="false" native="false" synchronized="false"
  6801. static="true" final="false" visibility="public"
  6802. deprecated="not deprecated">
  6803. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6804. <param name="attemptsToStartSkipping" type="int"/>
  6805. <doc>
  6806. <![CDATA[Set the number of Task attempts AFTER which skip mode
  6807. will be kicked off. When skip mode is kicked off, the
  6808. task reports the range of records which it will process
  6809. next to the TaskTracker, so that on failure the TaskTracker knows which
  6810. records are possibly bad. On further executions,
  6811. those are skipped.
  6812. Default value is 2.
  6813. @param conf the configuration
  6814. @param attemptsToStartSkipping no of task attempts]]>
  6815. </doc>
  6816. </method>
  6817. <method name="getAutoIncrMapperProcCount" return="boolean"
  6818. abstract="false" native="false" synchronized="false"
  6819. static="true" final="false" visibility="public"
  6820. deprecated="not deprecated">
  6821. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6822. <doc>
  6823. <![CDATA[Get the flag which if set to true,
  6824. {@link SkipBadRecords#COUNTER_MAP_PROCESSED_RECORDS} is incremented
  6825. by MapRunner after invoking the map function. This value must be set to
  6826. false for applications which process the records asynchronously
  6827. or buffer the input records. For example streaming.
  6828. In such cases applications should increment this counter on their own.
  6829. Default value is true.
  6830. @param conf the configuration
  6831. @return <code>true</code> if auto increment
  6832. {@link SkipBadRecords#COUNTER_MAP_PROCESSED_RECORDS}.
  6833. <code>false</code> otherwise.]]>
  6834. </doc>
  6835. </method>
  6836. <method name="setAutoIncrMapperProcCount"
  6837. abstract="false" native="false" synchronized="false"
  6838. static="true" final="false" visibility="public"
  6839. deprecated="not deprecated">
  6840. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6841. <param name="autoIncr" type="boolean"/>
  6842. <doc>
  6843. <![CDATA[Set the flag which if set to true,
  6844. {@link SkipBadRecords#COUNTER_MAP_PROCESSED_RECORDS} is incremented
  6845. by MapRunner after invoking the map function. This value must be set to
  6846. false for applications which process the records asynchronously
  6847. or buffer the input records. For example streaming.
  6848. In such cases applications should increment this counter on their own.
  6849. Default value is true.
  6850. @param conf the configuration
  6851. @param autoIncr whether to auto increment
  6852. {@link SkipBadRecords#COUNTER_MAP_PROCESSED_RECORDS}.]]>
  6853. </doc>
  6854. </method>
  6855. <method name="getAutoIncrReducerProcCount" return="boolean"
  6856. abstract="false" native="false" synchronized="false"
  6857. static="true" final="false" visibility="public"
  6858. deprecated="not deprecated">
  6859. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6860. <doc>
  6861. <![CDATA[Get the flag which if set to true,
  6862. {@link SkipBadRecords#COUNTER_REDUCE_PROCESSED_GROUPS} is incremented
  6863. by framework after invoking the reduce function. This value must be set to
  6864. false for applications which process the records asynchronously
  6865. or buffer the input records. For example streaming.
  6866. In such cases applications should increment this counter on their own.
  6867. Default value is true.
  6868. @param conf the configuration
  6869. @return <code>true</code> if auto increment
  6870. {@link SkipBadRecords#COUNTER_REDUCE_PROCESSED_GROUPS}.
  6871. <code>false</code> otherwise.]]>
  6872. </doc>
  6873. </method>
  6874. <method name="setAutoIncrReducerProcCount"
  6875. abstract="false" native="false" synchronized="false"
  6876. static="true" final="false" visibility="public"
  6877. deprecated="not deprecated">
  6878. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6879. <param name="autoIncr" type="boolean"/>
  6880. <doc>
  6881. <![CDATA[Set the flag which if set to true,
  6882. {@link SkipBadRecords#COUNTER_REDUCE_PROCESSED_GROUPS} is incremented
  6883. by framework after invoking the reduce function. This value must be set to
  6884. false for applications which process the records asynchronously
  6885. or buffer the input records. For example streaming.
  6886. In such cases applications should increment this counter on their own.
  6887. Default value is true.
  6888. @param conf the configuration
  6889. @param autoIncr whether to auto increment
  6890. {@link SkipBadRecords#COUNTER_REDUCE_PROCESSED_GROUPS}.]]>
  6891. </doc>
  6892. </method>
  6893. <method name="getSkipOutputPath" return="org.apache.hadoop.fs.Path"
  6894. abstract="false" native="false" synchronized="false"
  6895. static="true" final="false" visibility="public"
  6896. deprecated="not deprecated">
  6897. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6898. <doc>
  6899. <![CDATA[Get the directory to which skipped records are written. By default it is
  6900. the sub directory of the output _logs directory.
  6901. User can stop writing skipped records by setting the value null.
  6902. @param conf the configuration.
  6903. @return path skip output directory. Null is returned if this is not set
  6904. and output directory is also not set.]]>
  6905. </doc>
  6906. </method>
  6907. <method name="setSkipOutputPath"
  6908. abstract="false" native="false" synchronized="false"
  6909. static="true" final="false" visibility="public"
  6910. deprecated="not deprecated">
  6911. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  6912. <param name="path" type="org.apache.hadoop.fs.Path"/>
  6913. <doc>
  6914. <![CDATA[Set the directory to which skipped records are written. By default it is
  6915. the sub directory of the output _logs directory.
  6916. User can stop writing skipped records by setting the value null.
  6917. @param conf the configuration.
  6918. @param path skip output directory path]]>
  6919. </doc>
  6920. </method>
  6921. <method name="getMapperMaxSkipRecords" return="long"
  6922. abstract="false" native="false" synchronized="false"
  6923. static="true" final="false" visibility="public"
  6924. deprecated="not deprecated">
  6925. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6926. <doc>
  6927. <![CDATA[Get the number of acceptable skip records surrounding the bad record PER
  6928. bad record in mapper. The number includes the bad record as well.
  6929. To turn the feature of detection/skipping of bad records off, set the
  6930. value to 0.
  6931. The framework tries to narrow down the skipped range by retrying
  6932. until this threshold is met OR all attempts get exhausted for this task.
  6933. Set the value to Long.MAX_VALUE to indicate that framework need not try to
  6934. narrow down. Whatever records(depends on application) get skipped are
  6935. acceptable.
  6936. Default value is 0.
  6937. @param conf the configuration
  6938. @return maxSkipRecs acceptable skip records.]]>
  6939. </doc>
  6940. </method>
  6941. <method name="setMapperMaxSkipRecords"
  6942. abstract="false" native="false" synchronized="false"
  6943. static="true" final="false" visibility="public"
  6944. deprecated="not deprecated">
  6945. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6946. <param name="maxSkipRecs" type="long"/>
  6947. <doc>
  6948. <![CDATA[Set the number of acceptable skip records surrounding the bad record PER
  6949. bad record in mapper. The number includes the bad record as well.
  6950. To turn the feature of detection/skipping of bad records off, set the
  6951. value to 0.
  6952. The framework tries to narrow down the skipped range by retrying
  6953. until this threshold is met OR all attempts get exhausted for this task.
  6954. Set the value to Long.MAX_VALUE to indicate that framework need not try to
  6955. narrow down. Whatever records(depends on application) get skipped are
  6956. acceptable.
  6957. Default value is 0.
  6958. @param conf the configuration
  6959. @param maxSkipRecs acceptable skip records.]]>
  6960. </doc>
  6961. </method>
  6962. <method name="getReducerMaxSkipGroups" return="long"
  6963. abstract="false" native="false" synchronized="false"
  6964. static="true" final="false" visibility="public"
  6965. deprecated="not deprecated">
  6966. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6967. <doc>
  6968. <![CDATA[Get the number of acceptable skip groups surrounding the bad group PER
  6969. bad group in reducer. The number includes the bad group as well.
  6970. To turn the feature of detection/skipping of bad groups off, set the
  6971. value to 0.
  6972. The framework tries to narrow down the skipped range by retrying
  6973. until this threshold is met OR all attempts get exhausted for this task.
  6974. Set the value to Long.MAX_VALUE to indicate that framework need not try to
  6975. narrow down. Whatever groups(depends on application) get skipped are
  6976. acceptable.
  6977. Default value is 0.
  6978. @param conf the configuration
  6979. @return maxSkipGrps acceptable skip groups.]]>
  6980. </doc>
  6981. </method>
  6982. <method name="setReducerMaxSkipGroups"
  6983. abstract="false" native="false" synchronized="false"
  6984. static="true" final="false" visibility="public"
  6985. deprecated="not deprecated">
  6986. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  6987. <param name="maxSkipGrps" type="long"/>
  6988. <doc>
  6989. <![CDATA[Set the number of acceptable skip groups surrounding the bad group PER
  6990. bad group in reducer. The number includes the bad group as well.
  6991. To turn the feature of detection/skipping of bad groups off, set the
  6992. value to 0.
  6993. The framework tries to narrow down the skipped range by retrying
  6994. until this threshold is met OR all attempts get exhausted for this task.
  6995. Set the value to Long.MAX_VALUE to indicate that framework need not try to
  6996. narrow down. Whatever groups(depends on application) get skipped are
  6997. acceptable.
  6998. Default value is 0.
  6999. @param conf the configuration
  7000. @param maxSkipGrps acceptable skip groups.]]>
  7001. </doc>
  7002. </method>
  7003. <field name="COUNTER_GROUP" type="java.lang.String"
  7004. transient="false" volatile="false"
  7005. static="true" final="true" visibility="public"
  7006. deprecated="not deprecated">
  7007. <doc>
  7008. <![CDATA[Special counters which are written by the application and are
  7009. used by the framework for detecting bad records. For detecting bad records
  7010. these counters must be incremented by the application.]]>
  7011. </doc>
  7012. </field>
  7013. <field name="COUNTER_MAP_PROCESSED_RECORDS" type="java.lang.String"
  7014. transient="false" volatile="false"
  7015. static="true" final="true" visibility="public"
  7016. deprecated="not deprecated">
  7017. <doc>
  7018. <![CDATA[Number of processed map records.
  7019. @see SkipBadRecords#getAutoIncrMapperProcCount(Configuration)]]>
  7020. </doc>
  7021. </field>
  7022. <field name="COUNTER_REDUCE_PROCESSED_GROUPS" type="java.lang.String"
  7023. transient="false" volatile="false"
  7024. static="true" final="true" visibility="public"
  7025. deprecated="not deprecated">
  7026. <doc>
  7027. <![CDATA[Number of processed reduce groups.
  7028. @see SkipBadRecords#getAutoIncrReducerProcCount(Configuration)]]>
  7029. </doc>
  7030. </field>
  7031. <doc>
  7032. <![CDATA[Utility class for skip bad records functionality. It contains various
  7033. settings related to skipping of bad records.
  7034. <p>Hadoop provides an optional mode of execution in which the bad records
  7035. are detected and skipped in further attempts.</p>
  7036. <p>This feature can be used when map/reduce tasks crash deterministically on
  7037. certain input. This happens due to bugs in the map/reduce function. The usual
  7038. course would be to fix these bugs. But sometimes this is not possible;
  7039. perhaps the bug is in third party libraries for which the source code is
  7040. not available. Due to this, the task never reaches completion even with
  7041. multiple attempts and complete data for that task is lost.</p>
  7042. <p>With this feature, only a small portion of data is lost surrounding
  7043. the bad record, which may be acceptable for some user applications.
  7044. see {@link SkipBadRecords#setMapperMaxSkipRecords(Configuration, long)}</p>
  7045. <p>The skipping mode gets kicked off after a certain number of failures;
  7046. see {@link SkipBadRecords#setAttemptsToStartSkipping(Configuration, int)}</p>
  7047. <p>In the skipping mode, the map/reduce task maintains the record range which
  7048. is getting processed at all times. Before giving the input to the
  7049. map/reduce function, it sends this record range to the Task tracker.
  7050. If the task crashes, the Task tracker knows which one was the last reported
  7051. range. On further attempts that range gets skipped.</p>]]>
  7052. </doc>
  7053. </class>
  7054. <!-- end class org.apache.hadoop.mapred.SkipBadRecords -->
  7055. <!-- start interface org.apache.hadoop.mapred.TaskAttemptContext -->
  7056. <interface name="TaskAttemptContext" abstract="true"
  7057. static="false" final="false" visibility="public"
  7058. deprecated="Use {@link org.apache.hadoop.mapreduce.TaskAttemptContext}
  7059. instead.">
  7060. <implements name="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  7061. <method name="getTaskAttemptID" return="org.apache.hadoop.mapred.TaskAttemptID"
  7062. abstract="false" native="false" synchronized="false"
  7063. static="false" final="false" visibility="public"
  7064. deprecated="not deprecated">
  7065. </method>
  7066. <method name="getProgressible" return="org.apache.hadoop.util.Progressable"
  7067. abstract="false" native="false" synchronized="false"
  7068. static="false" final="false" visibility="public"
  7069. deprecated="not deprecated">
  7070. </method>
  7071. <method name="getJobConf" return="org.apache.hadoop.mapred.JobConf"
  7072. abstract="false" native="false" synchronized="false"
  7073. static="false" final="false" visibility="public"
  7074. deprecated="not deprecated">
  7075. </method>
  7076. <doc>
  7077. <![CDATA[@deprecated Use {@link org.apache.hadoop.mapreduce.TaskAttemptContext}
  7078. instead.]]>
  7079. </doc>
  7080. </interface>
  7081. <!-- end interface org.apache.hadoop.mapred.TaskAttemptContext -->
  7082. <!-- start class org.apache.hadoop.mapred.TaskAttemptID -->
  7083. <class name="TaskAttemptID" extends="org.apache.hadoop.mapreduce.TaskAttemptID"
  7084. abstract="false"
  7085. static="false" final="false" visibility="public"
  7086. deprecated="not deprecated">
  7087. <constructor name="TaskAttemptID" type="org.apache.hadoop.mapred.TaskID, int"
  7088. static="false" final="false" visibility="public"
  7089. deprecated="not deprecated">
  7090. <doc>
  7091. <![CDATA[Constructs a TaskAttemptID object from given {@link TaskID}.
  7092. @param taskId TaskID that this task belongs to
  7093. @param id the task attempt number]]>
  7094. </doc>
  7095. </constructor>
  7096. <constructor name="TaskAttemptID" type="java.lang.String, int, boolean, int, int"
  7097. static="false" final="false" visibility="public"
  7098. deprecated="Use {@link #TaskAttemptID(String, int, TaskType, int, int)}.">
  7099. <doc>
  7100. <![CDATA[Constructs a TaskAttemptID object from given parts.
  7101. @param jtIdentifier jobTracker identifier
  7102. @param jobId job number
  7103. @param isMap whether the tip is a map
  7104. @param taskId taskId number
  7105. @param id the task attempt number
  7106. @deprecated Use {@link #TaskAttemptID(String, int, TaskType, int, int)}.]]>
  7107. </doc>
  7108. </constructor>
  7109. <constructor name="TaskAttemptID" type="java.lang.String, int, org.apache.hadoop.mapreduce.TaskType, int, int"
  7110. static="false" final="false" visibility="public"
  7111. deprecated="not deprecated">
  7112. <doc>
  7113. <![CDATA[Constructs a TaskAttemptID object from given parts.
  7114. @param jtIdentifier jobTracker identifier
  7115. @param jobId job number
  7116. @param type the TaskType
  7117. @param taskId taskId number
  7118. @param id the task attempt number]]>
  7119. </doc>
  7120. </constructor>
  7121. <constructor name="TaskAttemptID"
  7122. static="false" final="false" visibility="public"
  7123. deprecated="not deprecated">
  7124. </constructor>
  7125. <method name="downgrade" return="org.apache.hadoop.mapred.TaskAttemptID"
  7126. abstract="false" native="false" synchronized="false"
  7127. static="true" final="false" visibility="public"
  7128. deprecated="not deprecated">
  7129. <param name="old" type="org.apache.hadoop.mapreduce.TaskAttemptID"/>
  7130. <doc>
  7131. <![CDATA[Downgrade a new TaskAttemptID to an old one
  7132. @param old the new id
  7133. @return either old or a new TaskAttemptID constructed to match old]]>
  7134. </doc>
  7135. </method>
  7136. <method name="getTaskID" return="org.apache.hadoop.mapred.TaskID"
  7137. abstract="false" native="false" synchronized="false"
  7138. static="false" final="false" visibility="public"
  7139. deprecated="not deprecated">
  7140. </method>
  7141. <method name="getJobID" return="org.apache.hadoop.mapred.JobID"
  7142. abstract="false" native="false" synchronized="false"
  7143. static="false" final="false" visibility="public"
  7144. deprecated="not deprecated">
  7145. </method>
  7146. <method name="read" return="org.apache.hadoop.mapred.TaskAttemptID"
  7147. abstract="false" native="false" synchronized="false"
  7148. static="true" final="false" visibility="public"
  7149. deprecated="not deprecated">
  7150. <param name="in" type="java.io.DataInput"/>
  7151. <exception name="IOException" type="java.io.IOException"/>
  7152. </method>
  7153. <method name="forName" return="org.apache.hadoop.mapred.TaskAttemptID"
  7154. abstract="false" native="false" synchronized="false"
  7155. static="true" final="false" visibility="public"
  7156. deprecated="not deprecated">
  7157. <param name="str" type="java.lang.String"/>
  7158. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  7159. <doc>
  7160. <![CDATA[Construct a TaskAttemptID object from given string
  7161. @return constructed TaskAttemptID object or null if the given String is null
  7162. @throws IllegalArgumentException if the given string is malformed]]>
  7163. </doc>
  7164. </method>
  7165. <method name="getTaskAttemptIDsPattern" return="java.lang.String"
  7166. abstract="false" native="false" synchronized="false"
  7167. static="true" final="false" visibility="public"
  7168. deprecated="not deprecated">
  7169. <param name="jtIdentifier" type="java.lang.String"/>
  7170. <param name="jobId" type="java.lang.Integer"/>
  7171. <param name="isMap" type="java.lang.Boolean"/>
  7172. <param name="taskId" type="java.lang.Integer"/>
  7173. <param name="attemptId" type="java.lang.Integer"/>
  7174. <doc>
  7175. <![CDATA[Returns a regex pattern which matches task attempt IDs. Arguments can
  7176. be given null, in which case that part of the regex will be generic.
  7177. For example to obtain a regex matching <i>all task attempt IDs</i>
  7178. of <i>any jobtracker</i>, in <i>any job</i>, of the <i>first
  7179. map task</i>, we would use :
  7180. <pre>
  7181. TaskAttemptID.getTaskAttemptIDsPattern(null, null, true, 1, null);
  7182. </pre>
  7183. which will return :
  7184. <pre> "attempt_[^_]*_[0-9]*_m_000001_[0-9]*" </pre>
  7185. @param jtIdentifier jobTracker identifier, or null
  7186. @param jobId job number, or null
  7187. @param isMap whether the tip is a map, or null
  7188. @param taskId taskId number, or null
  7189. @param attemptId the task attempt number, or null
  7190. @return a regex pattern matching TaskAttemptIDs]]>
  7191. </doc>
  7192. </method>
  7193. <method name="getTaskAttemptIDsPattern" return="java.lang.String"
  7194. abstract="false" native="false" synchronized="false"
  7195. static="true" final="false" visibility="public"
  7196. deprecated="not deprecated">
  7197. <param name="jtIdentifier" type="java.lang.String"/>
  7198. <param name="jobId" type="java.lang.Integer"/>
  7199. <param name="type" type="org.apache.hadoop.mapreduce.TaskType"/>
  7200. <param name="taskId" type="java.lang.Integer"/>
  7201. <param name="attemptId" type="java.lang.Integer"/>
  7202. <doc>
  7203. <![CDATA[Returns a regex pattern which matches task attempt IDs. Arguments can
  7204. be given null, in which case that part of the regex will be generic.
  7205. For example to obtain a regex matching <i>all task attempt IDs</i>
  7206. of <i>any jobtracker</i>, in <i>any job</i>, of the <i>first
  7207. map task</i>, we would use :
  7208. <pre>
  7209. TaskAttemptID.getTaskAttemptIDsPattern(null, null, TaskType.MAP, 1, null);
  7210. </pre>
  7211. which will return :
  7212. <pre> "attempt_[^_]*_[0-9]*_m_000001_[0-9]*" </pre>
  7213. @param jtIdentifier jobTracker identifier, or null
  7214. @param jobId job number, or null
  7215. @param type the {@link TaskType}
  7216. @param taskId taskId number, or null
  7217. @param attemptId the task attempt number, or null
  7218. @return a regex pattern matching TaskAttemptIDs]]>
  7219. </doc>
  7220. </method>
  7221. <doc>
  7222. <![CDATA[TaskAttemptID represents the immutable and unique identifier for
  7223. a task attempt. Each task attempt is one particular instance of a Map or
  7224. Reduce Task identified by its TaskID.
  7225. TaskAttemptID consists of 2 parts. First part is the
  7226. {@link TaskID}, that this TaskAttemptID belongs to.
  7227. Second part is the task attempt number. <br>
  7228. An example TaskAttemptID is :
  7229. <code>attempt_200707121733_0003_m_000005_0</code> , which represents the
  7230. zeroth task attempt for the fifth map task in the third job
  7231. running at the jobtracker started at <code>200707121733</code>.
  7232. <p>
  7233. Applications should never construct or parse TaskAttemptID strings,
  7234. but rather use appropriate constructors or {@link #forName(String)}
  7235. method.
  7236. @see JobID
  7237. @see TaskID]]>
  7238. </doc>
  7239. </class>
  7240. <!-- end class org.apache.hadoop.mapred.TaskAttemptID -->
  7241. <!-- start class org.apache.hadoop.mapred.TaskCompletionEvent -->
  7242. <class name="TaskCompletionEvent" extends="org.apache.hadoop.mapreduce.TaskCompletionEvent"
  7243. abstract="false"
  7244. static="false" final="false" visibility="public"
  7245. deprecated="Use
  7246. {@link org.apache.hadoop.mapreduce.TaskCompletionEvent} instead">
  7247. <constructor name="TaskCompletionEvent"
  7248. static="false" final="false" visibility="public"
  7249. deprecated="not deprecated">
  7250. <doc>
  7251. <![CDATA[Default constructor for Writable.]]>
  7252. </doc>
  7253. </constructor>
  7254. <constructor name="TaskCompletionEvent" type="int, org.apache.hadoop.mapred.TaskAttemptID, int, boolean, org.apache.hadoop.mapred.TaskCompletionEvent.Status, java.lang.String"
  7255. static="false" final="false" visibility="public"
  7256. deprecated="not deprecated">
  7257. <doc>
  7258. <![CDATA[Constructor. eventId should be created externally and incremented
  7259. per event for each job.
  7260. @param eventId event id; event ids should be unique and assigned
  7261. incrementally, starting from 0.
  7262. @param taskId task id
  7263. @param status task's status
  7264. @param taskTrackerHttp task tracker's host:port for http.]]>
  7265. </doc>
  7266. </constructor>
  7267. <method name="getTaskId" return="java.lang.String"
  7268. abstract="false" native="false" synchronized="false"
  7269. static="false" final="false" visibility="public"
  7270. deprecated="use {@link #getTaskAttemptId()} instead.">
  7271. <doc>
  7272. <![CDATA[Returns task id.
  7273. @return task id
  7274. @deprecated use {@link #getTaskAttemptId()} instead.]]>
  7275. </doc>
  7276. </method>
  7277. <method name="getTaskAttemptId" return="org.apache.hadoop.mapred.TaskAttemptID"
  7278. abstract="false" native="false" synchronized="false"
  7279. static="false" final="false" visibility="public"
  7280. deprecated="not deprecated">
  7281. <doc>
  7282. <![CDATA[Returns task id.
  7283. @return task id]]>
  7284. </doc>
  7285. </method>
  7286. <method name="getTaskStatus" return="org.apache.hadoop.mapred.TaskCompletionEvent.Status"
  7287. abstract="false" native="false" synchronized="false"
  7288. static="false" final="false" visibility="public"
  7289. deprecated="not deprecated">
  7290. <doc>
  7291. <![CDATA[Returns enum Status.SUCCESS or Status.FAILURE.
  7292. @return task tracker status]]>
  7293. </doc>
  7294. </method>
  7295. <method name="setTaskId"
  7296. abstract="false" native="false" synchronized="false"
  7297. static="false" final="false" visibility="public"
  7298. deprecated="use {@link #setTaskAttemptId(TaskAttemptID)} instead.">
  7299. <param name="taskId" type="java.lang.String"/>
  7300. <doc>
  7301. <![CDATA[Sets task id.
  7302. @param taskId
  7303. @deprecated use {@link #setTaskAttemptId(TaskAttemptID)} instead.]]>
  7304. </doc>
  7305. </method>
  7306. <method name="setTaskAttemptId"
  7307. abstract="false" native="false" synchronized="false"
  7308. static="false" final="false" visibility="protected"
  7309. deprecated="not deprecated">
  7310. <param name="taskId" type="org.apache.hadoop.mapred.TaskAttemptID"/>
  7311. <doc>
  7312. <![CDATA[Sets task id.
  7313. @param taskId]]>
  7314. </doc>
  7315. </method>
  7316. <method name="setTaskStatus"
  7317. abstract="false" native="false" synchronized="false"
  7318. static="false" final="false" visibility="protected"
  7319. deprecated="not deprecated">
  7320. <param name="status" type="org.apache.hadoop.mapred.TaskCompletionEvent.Status"/>
  7321. <doc>
  7322. <![CDATA[Set task status.
  7323. @param status]]>
  7324. </doc>
  7325. </method>
  7326. <method name="setTaskRunTime"
  7327. abstract="false" native="false" synchronized="false"
  7328. static="false" final="false" visibility="protected"
  7329. deprecated="not deprecated">
  7330. <param name="taskCompletionTime" type="int"/>
  7331. <doc>
  7332. <![CDATA[Set the task completion time
  7333. @param taskCompletionTime time (in millisec) the task took to complete]]>
  7334. </doc>
  7335. </method>
  7336. <method name="setEventId"
  7337. abstract="false" native="false" synchronized="false"
  7338. static="false" final="false" visibility="protected"
  7339. deprecated="not deprecated">
  7340. <param name="eventId" type="int"/>
  7341. <doc>
  7342. <![CDATA[Set event id. It should be assigned incrementally starting from 0.
  7343. @param eventId]]>
  7344. </doc>
  7345. </method>
  7346. <method name="setTaskTrackerHttp"
  7347. abstract="false" native="false" synchronized="false"
  7348. static="false" final="false" visibility="protected"
  7349. deprecated="not deprecated">
  7350. <param name="taskTrackerHttp" type="java.lang.String"/>
  7351. <doc>
  7352. <![CDATA[Set task tracker http location.
  7353. @param taskTrackerHttp]]>
  7354. </doc>
  7355. </method>
  7356. <field name="EMPTY_ARRAY" type="org.apache.hadoop.mapred.TaskCompletionEvent[]"
  7357. transient="false" volatile="false"
  7358. static="true" final="true" visibility="public"
  7359. deprecated="not deprecated">
  7360. </field>
  7361. <doc>
  7362. <![CDATA[This is used to track task completion events on
  7363. job tracker.
  7364. @deprecated Use
  7365. {@link org.apache.hadoop.mapreduce.TaskCompletionEvent} instead]]>
  7366. </doc>
  7367. </class>
  7368. <!-- end class org.apache.hadoop.mapred.TaskCompletionEvent -->
  7369. <!-- start class org.apache.hadoop.mapred.TaskCompletionEvent.Status -->
  7370. <class name="TaskCompletionEvent.Status" extends="java.lang.Enum"
  7371. abstract="false"
  7372. static="true" final="true" visibility="public"
  7373. deprecated="not deprecated">
  7374. <method name="values" return="org.apache.hadoop.mapred.TaskCompletionEvent.Status[]"
  7375. abstract="false" native="false" synchronized="false"
  7376. static="true" final="false" visibility="public"
  7377. deprecated="not deprecated">
  7378. </method>
  7379. <method name="valueOf" return="org.apache.hadoop.mapred.TaskCompletionEvent.Status"
  7380. abstract="false" native="false" synchronized="false"
  7381. static="true" final="false" visibility="public"
  7382. deprecated="not deprecated">
  7383. <param name="name" type="java.lang.String"/>
  7384. </method>
  7385. </class>
  7386. <!-- end class org.apache.hadoop.mapred.TaskCompletionEvent.Status -->
  7387. <!-- start class org.apache.hadoop.mapred.TaskID -->
  7388. <class name="TaskID" extends="org.apache.hadoop.mapreduce.TaskID"
  7389. abstract="false"
  7390. static="false" final="false" visibility="public"
  7391. deprecated="not deprecated">
  7392. <constructor name="TaskID" type="org.apache.hadoop.mapreduce.JobID, boolean, int"
  7393. static="false" final="false" visibility="public"
  7394. deprecated="Use {@link #TaskID(String, int, TaskType, int)}">
  7395. <doc>
  7396. <![CDATA[Constructs a TaskID object from given {@link JobID}.
  7397. @param jobId JobID that this tip belongs to
  7398. @param isMap whether the tip is a map
  7399. @param id the tip number
  7400. @deprecated Use {@link #TaskID(String, int, TaskType, int)}]]>
  7401. </doc>
  7402. </constructor>
  7403. <constructor name="TaskID" type="java.lang.String, int, boolean, int"
  7404. static="false" final="false" visibility="public"
  7405. deprecated="Use {@link #TaskID(org.apache.hadoop.mapreduce.JobID, TaskType,
  7406. int)}">
  7407. <doc>
  7408. <![CDATA[Constructs a TaskInProgressId object from given parts.
  7409. @param jtIdentifier jobTracker identifier
  7410. @param jobId job number
  7411. @param isMap whether the tip is a map
  7412. @param id the tip number
  7413. @deprecated Use {@link #TaskID(org.apache.hadoop.mapreduce.JobID, TaskType,
  7414. int)}]]>
  7415. </doc>
  7416. </constructor>
  7417. <constructor name="TaskID" type="org.apache.hadoop.mapreduce.JobID, org.apache.hadoop.mapreduce.TaskType, int"
  7418. static="false" final="false" visibility="public"
  7419. deprecated="not deprecated">
  7420. <doc>
  7421. <![CDATA[Constructs a TaskID object from given {@link JobID}.
  7422. @param jobId JobID that this tip belongs to
  7423. @param type the {@link TaskType}
  7424. @param id the tip number]]>
  7425. </doc>
  7426. </constructor>
  7427. <constructor name="TaskID" type="java.lang.String, int, org.apache.hadoop.mapreduce.TaskType, int"
  7428. static="false" final="false" visibility="public"
  7429. deprecated="not deprecated">
  7430. <doc>
  7431. <![CDATA[Constructs a TaskInProgressId object from given parts.
  7432. @param jtIdentifier jobTracker identifier
  7433. @param jobId job number
  7434. @param type the {@link TaskType}
  7435. @param id the tip number]]>
  7436. </doc>
  7437. </constructor>
  7438. <constructor name="TaskID"
  7439. static="false" final="false" visibility="public"
  7440. deprecated="not deprecated">
  7441. </constructor>
  7442. <method name="downgrade" return="org.apache.hadoop.mapred.TaskID"
  7443. abstract="false" native="false" synchronized="false"
  7444. static="true" final="false" visibility="public"
  7445. deprecated="not deprecated">
  7446. <param name="old" type="org.apache.hadoop.mapreduce.TaskID"/>
  7447. <doc>
  7448. <![CDATA[Downgrade a new TaskID to an old one
  7449. @param old a new or old TaskID
  7450. @return either old or a new TaskID built to match old]]>
  7451. </doc>
  7452. </method>
  7453. <method name="read" return="org.apache.hadoop.mapred.TaskID"
  7454. abstract="false" native="false" synchronized="false"
  7455. static="true" final="false" visibility="public"
  7456. deprecated="not deprecated">
  7457. <param name="in" type="java.io.DataInput"/>
  7458. <exception name="IOException" type="java.io.IOException"/>
  7459. </method>
  7460. <method name="getJobID" return="org.apache.hadoop.mapred.JobID"
  7461. abstract="false" native="false" synchronized="false"
  7462. static="false" final="false" visibility="public"
  7463. deprecated="not deprecated">
  7464. </method>
  7465. <method name="getTaskIDsPattern" return="java.lang.String"
  7466. abstract="false" native="false" synchronized="false"
  7467. static="true" final="false" visibility="public"
  7468. deprecated="Use {@link TaskID#getTaskIDsPattern(String, Integer, TaskType,
  7469. Integer)}">
  7470. <param name="jtIdentifier" type="java.lang.String"/>
  7471. <param name="jobId" type="java.lang.Integer"/>
  7472. <param name="isMap" type="java.lang.Boolean"/>
  7473. <param name="taskId" type="java.lang.Integer"/>
  7474. <doc>
  7475. <![CDATA[Returns a regex pattern which matches task IDs. Arguments can
  7476. be given null, in which case that part of the regex will be generic.
  7477. For example to obtain a regex matching <i>the first map task</i>
  7478. of <i>any jobtracker</i>, of <i>any job</i>, we would use :
  7479. <pre>
  7480. TaskID.getTaskIDsPattern(null, null, true, 1);
  7481. </pre>
  7482. which will return :
  7483. <pre> "task_[^_]*_[0-9]*_m_000001*" </pre>
  7484. @param jtIdentifier jobTracker identifier, or null
  7485. @param jobId job number, or null
  7486. @param isMap whether the tip is a map, or null
  7487. @param taskId taskId number, or null
  7488. @return a regex pattern matching TaskIDs
  7489. @deprecated Use {@link TaskID#getTaskIDsPattern(String, Integer, TaskType,
  7490. Integer)}]]>
  7491. </doc>
  7492. </method>
  7493. <method name="getTaskIDsPattern" return="java.lang.String"
  7494. abstract="false" native="false" synchronized="false"
  7495. static="true" final="false" visibility="public"
  7496. deprecated="not deprecated">
  7497. <param name="jtIdentifier" type="java.lang.String"/>
  7498. <param name="jobId" type="java.lang.Integer"/>
  7499. <param name="type" type="org.apache.hadoop.mapreduce.TaskType"/>
  7500. <param name="taskId" type="java.lang.Integer"/>
  7501. <doc>
  7502. <![CDATA[Returns a regex pattern which matches task IDs. Arguments can
  7503. be given null, in which case that part of the regex will be generic.
  7504. For example to obtain a regex matching <i>the first map task</i>
  7505. of <i>any jobtracker</i>, of <i>any job</i>, we would use :
  7506. <pre>
  7507. TaskID.getTaskIDsPattern(null, null, TaskType.MAP, 1);
  7508. </pre>
  7509. which will return :
  7510. <pre> "task_[^_]*_[0-9]*_m_000001*" </pre>
  7511. @param jtIdentifier jobTracker identifier, or null
  7512. @param jobId job number, or null
  7513. @param type the {@link TaskType}, or null
  7514. @param taskId taskId number, or null
  7515. @return a regex pattern matching TaskIDs]]>
  7516. </doc>
  7517. </method>
  7518. <method name="forName" return="org.apache.hadoop.mapred.TaskID"
  7519. abstract="false" native="false" synchronized="false"
  7520. static="true" final="false" visibility="public"
  7521. deprecated="not deprecated">
  7522. <param name="str" type="java.lang.String"/>
  7523. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  7524. </method>
  7525. <doc>
  7526. <![CDATA[TaskID represents the immutable and unique identifier for
  7527. a Map or Reduce Task. Each TaskID encompasses multiple attempts made to
  7528. execute the Map or Reduce Task, each of which is uniquely identified by
  7529. their TaskAttemptID.
  7530. TaskID consists of 3 parts. First part is the {@link JobID}, that this
  7531. TaskInProgress belongs to. Second part of the TaskID is either 'm' or 'r'
  7532. representing whether the task is a map task or a reduce task.
  7533. And the third part is the task number. <br>
  7534. An example TaskID is :
  7535. <code>task_200707121733_0003_m_000005</code> , which represents the
  7536. fifth map task in the third job running at the jobtracker
  7537. started at <code>200707121733</code>.
  7538. <p>
  7539. Applications should never construct or parse TaskID strings,
  7540. but rather use appropriate constructors or {@link #forName(String)}
  7541. method.
  7542. @see JobID
  7543. @see TaskAttemptID]]>
  7544. </doc>
  7545. </class>
  7546. <!-- end class org.apache.hadoop.mapred.TaskID -->
  7547. <!-- start class org.apache.hadoop.mapred.TaskLog.Reader -->
  7548. <class name="TaskLog.Reader" extends="java.io.InputStream"
  7549. abstract="false"
  7550. static="true" final="false" visibility="public"
  7551. deprecated="not deprecated">
  7552. <constructor name="TaskLog.Reader" type="org.apache.hadoop.mapred.TaskAttemptID, org.apache.hadoop.mapred.TaskLog.LogName, long, long, boolean"
  7553. static="false" final="false" visibility="public"
  7554. deprecated="not deprecated">
  7555. <exception name="IOException" type="java.io.IOException"/>
  7556. <doc>
  7557. <![CDATA[Read a log file from start to end positions. The offsets may be negative,
  7558. in which case they are relative to the end of the file. For example,
  7559. Reader(taskid, kind, 0, -1) is the entire file and
  7560. Reader(taskid, kind, -4197, -1) is the last 4196 bytes.
  7561. @param taskid the id of the task to read the log file for
  7562. @param kind the kind of log to read
  7563. @param start the offset to read from (negative is relative to tail)
  7564. @param end the offset to read up to (negative is relative to tail)
  7565. @param isCleanup whether the attempt is cleanup attempt or not
  7566. @throws IOException]]>
  7567. </doc>
  7568. </constructor>
  7569. <method name="read" return="int"
  7570. abstract="false" native="false" synchronized="false"
  7571. static="false" final="false" visibility="public"
  7572. deprecated="not deprecated">
  7573. <exception name="IOException" type="java.io.IOException"/>
  7574. </method>
  7575. <method name="read" return="int"
  7576. abstract="false" native="false" synchronized="false"
  7577. static="false" final="false" visibility="public"
  7578. deprecated="not deprecated">
  7579. <param name="buffer" type="byte[]"/>
  7580. <param name="offset" type="int"/>
  7581. <param name="length" type="int"/>
  7582. <exception name="IOException" type="java.io.IOException"/>
  7583. </method>
  7584. <method name="available" return="int"
  7585. abstract="false" native="false" synchronized="false"
  7586. static="false" final="false" visibility="public"
  7587. deprecated="not deprecated">
  7588. <exception name="IOException" type="java.io.IOException"/>
  7589. </method>
  7590. <method name="close"
  7591. abstract="false" native="false" synchronized="false"
  7592. static="false" final="false" visibility="public"
  7593. deprecated="not deprecated">
  7594. <exception name="IOException" type="java.io.IOException"/>
  7595. </method>
  7596. </class>
  7597. <!-- end class org.apache.hadoop.mapred.TaskLog.Reader -->
  7598. <!-- start class org.apache.hadoop.mapred.TaskLogAppender -->
  7599. <class name="TaskLogAppender" extends="org.apache.log4j.FileAppender"
  7600. abstract="false"
  7601. static="false" final="false" visibility="public"
  7602. deprecated="not deprecated">
  7603. <constructor name="TaskLogAppender"
  7604. static="false" final="false" visibility="public"
  7605. deprecated="not deprecated">
  7606. </constructor>
  7607. <method name="activateOptions"
  7608. abstract="false" native="false" synchronized="false"
  7609. static="false" final="false" visibility="public"
  7610. deprecated="not deprecated">
  7611. </method>
  7612. <method name="append"
  7613. abstract="false" native="false" synchronized="false"
  7614. static="false" final="false" visibility="public"
  7615. deprecated="not deprecated">
  7616. <param name="event" type="org.apache.log4j.spi.LoggingEvent"/>
  7617. </method>
  7618. <method name="flush"
  7619. abstract="false" native="false" synchronized="false"
  7620. static="false" final="false" visibility="public"
  7621. deprecated="not deprecated">
  7622. </method>
  7623. <method name="close"
  7624. abstract="false" native="false" synchronized="true"
  7625. static="false" final="false" visibility="public"
  7626. deprecated="not deprecated">
  7627. </method>
  7628. <method name="getTaskId" return="java.lang.String"
  7629. abstract="false" native="false" synchronized="true"
  7630. static="false" final="false" visibility="public"
  7631. deprecated="not deprecated">
  7632. <doc>
  7633. <![CDATA[Getter/Setter methods for log4j.]]>
  7634. </doc>
  7635. </method>
  7636. <method name="setTaskId"
  7637. abstract="false" native="false" synchronized="true"
  7638. static="false" final="false" visibility="public"
  7639. deprecated="not deprecated">
  7640. <param name="taskId" type="java.lang.String"/>
  7641. </method>
  7642. <method name="getTotalLogFileSize" return="long"
  7643. abstract="false" native="false" synchronized="true"
  7644. static="false" final="false" visibility="public"
  7645. deprecated="not deprecated">
  7646. </method>
  7647. <method name="setTotalLogFileSize"
  7648. abstract="false" native="false" synchronized="true"
  7649. static="false" final="false" visibility="public"
  7650. deprecated="not deprecated">
  7651. <param name="logSize" type="long"/>
  7652. </method>
  7653. <method name="setIsCleanup"
  7654. abstract="false" native="false" synchronized="true"
  7655. static="false" final="false" visibility="public"
  7656. deprecated="not deprecated">
  7657. <param name="isCleanup" type="boolean"/>
  7658. <doc>
  7659. <![CDATA[Set whether the task is a cleanup attempt or not.
  7660. @param isCleanup
  7661. true if the task is cleanup attempt, false otherwise.]]>
  7662. </doc>
  7663. </method>
  7664. <method name="getIsCleanup" return="boolean"
  7665. abstract="false" native="false" synchronized="true"
  7666. static="false" final="false" visibility="public"
  7667. deprecated="not deprecated">
  7668. <doc>
  7669. <![CDATA[Get whether task is cleanup attempt or not.
  7670. @return true if the task is cleanup attempt, false otherwise.]]>
  7671. </doc>
  7672. </method>
  7673. <doc>
  7674. <![CDATA[A simple log4j-appender for the task child's
  7675. map-reduce system logs.]]>
  7676. </doc>
  7677. </class>
  7678. <!-- end class org.apache.hadoop.mapred.TaskLogAppender -->
  7679. <!-- start class org.apache.hadoop.mapred.TaskReport -->
  7680. <class name="TaskReport" extends="org.apache.hadoop.mapreduce.TaskReport"
  7681. abstract="false"
  7682. static="false" final="false" visibility="public"
  7683. deprecated="Use {@link org.apache.hadoop.mapreduce.TaskReport} instead">
  7684. <constructor name="TaskReport"
  7685. static="false" final="false" visibility="public"
  7686. deprecated="not deprecated">
  7687. </constructor>
  7688. <method name="getTaskID" return="org.apache.hadoop.mapred.TaskID"
  7689. abstract="false" native="false" synchronized="false"
  7690. static="false" final="false" visibility="public"
  7691. deprecated="not deprecated">
  7692. <doc>
  7693. <![CDATA[The id of the task.]]>
  7694. </doc>
  7695. </method>
  7696. <method name="getCounters" return="org.apache.hadoop.mapred.Counters"
  7697. abstract="false" native="false" synchronized="false"
  7698. static="false" final="false" visibility="public"
  7699. deprecated="not deprecated">
  7700. </method>
  7701. <method name="setSuccessfulAttempt"
  7702. abstract="false" native="false" synchronized="false"
  7703. static="false" final="false" visibility="public"
  7704. deprecated="not deprecated">
  7705. <param name="t" type="org.apache.hadoop.mapred.TaskAttemptID"/>
  7706. <doc>
  7707. <![CDATA[set successful attempt ID of the task.]]>
  7708. </doc>
  7709. </method>
  7710. <method name="getSuccessfulTaskAttempt" return="org.apache.hadoop.mapred.TaskAttemptID"
  7711. abstract="false" native="false" synchronized="false"
  7712. static="false" final="false" visibility="public"
  7713. deprecated="not deprecated">
  7714. <doc>
  7715. <![CDATA[Get the attempt ID that took this task to completion]]>
  7716. </doc>
  7717. </method>
  7718. <method name="setRunningTaskAttempts"
  7719. abstract="false" native="false" synchronized="false"
  7720. static="false" final="false" visibility="public"
  7721. deprecated="not deprecated">
  7722. <param name="runningAttempts" type="java.util.Collection"/>
  7723. <doc>
  7724. <![CDATA[set running attempt(s) of the task.]]>
  7725. </doc>
  7726. </method>
  7727. <method name="getRunningTaskAttempts" return="java.util.Collection"
  7728. abstract="false" native="false" synchronized="false"
  7729. static="false" final="false" visibility="public"
  7730. deprecated="not deprecated">
  7731. <doc>
  7732. <![CDATA[Get the running task attempt IDs for this task]]>
  7733. </doc>
  7734. </method>
  7735. <method name="setFinishTime"
  7736. abstract="false" native="false" synchronized="false"
  7737. static="false" final="false" visibility="protected"
  7738. deprecated="not deprecated">
  7739. <param name="finishTime" type="long"/>
  7740. <doc>
  7741. <![CDATA[set finish time of task.
  7742. @param finishTime finish time of task.]]>
  7743. </doc>
  7744. </method>
  7745. <method name="setStartTime"
  7746. abstract="false" native="false" synchronized="false"
  7747. static="false" final="false" visibility="protected"
  7748. deprecated="not deprecated">
  7749. <param name="startTime" type="long"/>
  7750. <doc>
  7751. <![CDATA[set start time of the task.]]>
  7752. </doc>
  7753. </method>
  7754. <doc>
  7755. <![CDATA[A report on the state of a task.
  7756. @deprecated Use {@link org.apache.hadoop.mapreduce.TaskReport} instead]]>
  7757. </doc>
  7758. </class>
  7759. <!-- end class org.apache.hadoop.mapred.TaskReport -->
  7760. <!-- start class org.apache.hadoop.mapred.TextInputFormat -->
  7761. <class name="TextInputFormat" extends="org.apache.hadoop.mapred.FileInputFormat"
  7762. abstract="false"
  7763. static="false" final="false" visibility="public"
  7764. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.input.TextInputFormat}
  7765. instead.">
  7766. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  7767. <constructor name="TextInputFormat"
  7768. static="false" final="false" visibility="public"
  7769. deprecated="not deprecated">
  7770. </constructor>
  7771. <method name="configure"
  7772. abstract="false" native="false" synchronized="false"
  7773. static="false" final="false" visibility="public"
  7774. deprecated="not deprecated">
  7775. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  7776. </method>
  7777. <method name="isSplitable" return="boolean"
  7778. abstract="false" native="false" synchronized="false"
  7779. static="false" final="false" visibility="protected"
  7780. deprecated="not deprecated">
  7781. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  7782. <param name="file" type="org.apache.hadoop.fs.Path"/>
  7783. </method>
  7784. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  7785. abstract="false" native="false" synchronized="false"
  7786. static="false" final="false" visibility="public"
  7787. deprecated="not deprecated">
  7788. <param name="genericSplit" type="org.apache.hadoop.mapred.InputSplit"/>
  7789. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  7790. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  7791. <exception name="IOException" type="java.io.IOException"/>
  7792. </method>
  7793. <doc>
  7794. <![CDATA[An {@link InputFormat} for plain text files. Files are broken into lines.
  7795. Either linefeed or carriage-return are used to signal end of line. Keys are
  7796. the position in the file, and values are the line of text.
  7797. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.input.TextInputFormat}
  7798. instead.]]>
  7799. </doc>
  7800. </class>
  7801. <!-- end class org.apache.hadoop.mapred.TextInputFormat -->
  7802. <!-- start class org.apache.hadoop.mapred.TextOutputFormat -->
  7803. <class name="TextOutputFormat" extends="org.apache.hadoop.mapred.FileOutputFormat"
  7804. abstract="false"
  7805. static="false" final="false" visibility="public"
  7806. deprecated="Use
  7807. {@link org.apache.hadoop.mapreduce.lib.output.TextOutputFormat} instead.">
  7808. <constructor name="TextOutputFormat"
  7809. static="false" final="false" visibility="public"
  7810. deprecated="not deprecated">
  7811. </constructor>
  7812. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  7813. abstract="false" native="false" synchronized="false"
  7814. static="false" final="false" visibility="public"
  7815. deprecated="not deprecated">
  7816. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  7817. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  7818. <param name="name" type="java.lang.String"/>
  7819. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  7820. <exception name="IOException" type="java.io.IOException"/>
  7821. </method>
  7822. <doc>
  7823. <![CDATA[An {@link OutputFormat} that writes plain text files.
  7824. @deprecated Use
  7825. {@link org.apache.hadoop.mapreduce.lib.output.TextOutputFormat} instead.]]>
  7826. </doc>
  7827. </class>
  7828. <!-- end class org.apache.hadoop.mapred.TextOutputFormat -->
  7829. <!-- start class org.apache.hadoop.mapred.TextOutputFormat.LineRecordWriter -->
  7830. <class name="TextOutputFormat.LineRecordWriter" extends="java.lang.Object"
  7831. abstract="false"
  7832. static="true" final="false" visibility="protected"
  7833. deprecated="not deprecated">
  7834. <implements name="org.apache.hadoop.mapred.RecordWriter"/>
  7835. <constructor name="TextOutputFormat.LineRecordWriter" type="java.io.DataOutputStream, java.lang.String"
  7836. static="false" final="false" visibility="public"
  7837. deprecated="not deprecated">
  7838. </constructor>
  7839. <constructor name="TextOutputFormat.LineRecordWriter" type="java.io.DataOutputStream"
  7840. static="false" final="false" visibility="public"
  7841. deprecated="not deprecated">
  7842. </constructor>
  7843. <method name="write"
  7844. abstract="false" native="false" synchronized="true"
  7845. static="false" final="false" visibility="public"
  7846. deprecated="not deprecated">
  7847. <param name="key" type="K"/>
  7848. <param name="value" type="V"/>
  7849. <exception name="IOException" type="java.io.IOException"/>
  7850. </method>
  7851. <method name="close"
  7852. abstract="false" native="false" synchronized="true"
  7853. static="false" final="false" visibility="public"
  7854. deprecated="not deprecated">
  7855. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  7856. <exception name="IOException" type="java.io.IOException"/>
  7857. </method>
  7858. <field name="out" type="java.io.DataOutputStream"
  7859. transient="false" volatile="false"
  7860. static="false" final="false" visibility="protected"
  7861. deprecated="not deprecated">
  7862. </field>
  7863. </class>
  7864. <!-- end class org.apache.hadoop.mapred.TextOutputFormat.LineRecordWriter -->
  7865. <!-- start class org.apache.hadoop.mapred.Utils -->
  7866. <class name="Utils" extends="java.lang.Object"
  7867. abstract="false"
  7868. static="false" final="false" visibility="public"
  7869. deprecated="not deprecated">
  7870. <constructor name="Utils"
  7871. static="false" final="false" visibility="public"
  7872. deprecated="not deprecated">
  7873. </constructor>
  7874. <doc>
  7875. <![CDATA[A utility class. It provides
  7876. a path filter utility to filter out output/part files in the output dir.]]>
  7877. </doc>
  7878. </class>
  7879. <!-- end class org.apache.hadoop.mapred.Utils -->
  7880. <!-- start class org.apache.hadoop.mapred.Utils.OutputFileUtils -->
  7881. <class name="Utils.OutputFileUtils" extends="java.lang.Object"
  7882. abstract="false"
  7883. static="true" final="false" visibility="public"
  7884. deprecated="not deprecated">
  7885. <constructor name="Utils.OutputFileUtils"
  7886. static="false" final="false" visibility="public"
  7887. deprecated="not deprecated">
  7888. </constructor>
  7889. </class>
  7890. <!-- end class org.apache.hadoop.mapred.Utils.OutputFileUtils -->
  7891. <!-- start class org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputFilesFilter -->
  7892. <class name="Utils.OutputFileUtils.OutputFilesFilter" extends="org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputLogFilter"
  7893. abstract="false"
  7894. static="true" final="false" visibility="public"
  7895. deprecated="not deprecated">
  7896. <constructor name="Utils.OutputFileUtils.OutputFilesFilter"
  7897. static="false" final="false" visibility="public"
  7898. deprecated="not deprecated">
  7899. </constructor>
  7900. <method name="accept" return="boolean"
  7901. abstract="false" native="false" synchronized="false"
  7902. static="false" final="false" visibility="public"
  7903. deprecated="not deprecated">
  7904. <param name="path" type="org.apache.hadoop.fs.Path"/>
  7905. </method>
  7906. <doc>
  7907. <![CDATA[This class filters output (part) files from the given directory.
  7908. It does not accept files with filenames _logs and _SUCCESS.
  7909. This can be used to list paths of output directory as follows:
  7910. Path[] fileList = FileUtil.stat2Paths(fs.listStatus(outDir,
  7911. new OutputFilesFilter()));]]>
  7912. </doc>
  7913. </class>
  7914. <!-- end class org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputFilesFilter -->
  7915. <!-- start class org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputLogFilter -->
  7916. <class name="Utils.OutputFileUtils.OutputLogFilter" extends="java.lang.Object"
  7917. abstract="false"
  7918. static="true" final="false" visibility="public"
  7919. deprecated="not deprecated">
  7920. <implements name="org.apache.hadoop.fs.PathFilter"/>
  7921. <constructor name="Utils.OutputFileUtils.OutputLogFilter"
  7922. static="false" final="false" visibility="public"
  7923. deprecated="not deprecated">
  7924. </constructor>
  7925. <method name="accept" return="boolean"
  7926. abstract="false" native="false" synchronized="false"
  7927. static="false" final="false" visibility="public"
  7928. deprecated="not deprecated">
  7929. <param name="path" type="org.apache.hadoop.fs.Path"/>
  7930. </method>
  7931. <doc>
  7932. <![CDATA[This class filters log files from the given directory.
  7933. It does not accept paths having _logs.
  7934. This can be used to list paths of output directory as follows:
  7935. Path[] fileList = FileUtil.stat2Paths(fs.listStatus(outDir,
  7936. new OutputLogFilter()));]]>
  7937. </doc>
  7938. </class>
  7939. <!-- end class org.apache.hadoop.mapred.Utils.OutputFileUtils.OutputLogFilter -->
  7940. </package>
  7941. <package name="org.apache.hadoop.mapred.jobcontrol">
  7942. <!-- start class org.apache.hadoop.mapred.jobcontrol.Job -->
  7943. <class name="Job" extends="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob"
  7944. abstract="false"
  7945. static="false" final="false" visibility="public"
  7946. deprecated="Use {@link ControlledJob} instead.">
  7947. <constructor name="Job" type="org.apache.hadoop.mapred.JobConf, java.util.ArrayList"
  7948. static="false" final="false" visibility="public"
  7949. deprecated="not deprecated">
  7950. <exception name="IOException" type="java.io.IOException"/>
  7951. <doc>
  7952. <![CDATA[Construct a job.
  7953. @param jobConf a mapred job configuration representing a job to be executed.
  7954. @param dependingJobs an array of jobs the current job depends on]]>
  7955. </doc>
  7956. </constructor>
  7957. <constructor name="Job" type="org.apache.hadoop.mapred.JobConf"
  7958. static="false" final="false" visibility="public"
  7959. deprecated="not deprecated">
  7960. <exception name="IOException" type="java.io.IOException"/>
  7961. </constructor>
  7962. <method name="getAssignedJobID" return="org.apache.hadoop.mapred.JobID"
  7963. abstract="false" native="false" synchronized="false"
  7964. static="false" final="false" visibility="public"
  7965. deprecated="not deprecated">
  7966. <doc>
  7967. <![CDATA[@return the mapred ID of this job as assigned by the
  7968. mapred framework.]]>
  7969. </doc>
  7970. </method>
  7971. <method name="setAssignedJobID"
  7972. abstract="false" native="false" synchronized="false"
  7973. static="false" final="false" visibility="public"
  7974. deprecated="setAssignedJobID should not be called.
  7975. JOBID is set by the framework.">
  7976. <param name="mapredJobID" type="org.apache.hadoop.mapred.JobID"/>
  7977. <doc>
  7978. <![CDATA[@deprecated setAssignedJobID should not be called.
  7979. JOBID is set by the framework.]]>
  7980. </doc>
  7981. </method>
  7982. <method name="getJobConf" return="org.apache.hadoop.mapred.JobConf"
  7983. abstract="false" native="false" synchronized="true"
  7984. static="false" final="false" visibility="public"
  7985. deprecated="not deprecated">
  7986. <doc>
  7987. <![CDATA[@return the mapred job conf of this job]]>
  7988. </doc>
  7989. </method>
  7990. <method name="setJobConf"
  7991. abstract="false" native="false" synchronized="true"
  7992. static="false" final="false" visibility="public"
  7993. deprecated="not deprecated">
  7994. <param name="jobConf" type="org.apache.hadoop.mapred.JobConf"/>
  7995. <doc>
  7996. <![CDATA[Set the mapred job conf for this job.
  7997. @param jobConf the mapred job conf for this job.]]>
  7998. </doc>
  7999. </method>
  8000. <method name="getState" return="int"
  8001. abstract="false" native="false" synchronized="true"
  8002. static="false" final="false" visibility="public"
  8003. deprecated="not deprecated">
  8004. <doc>
  8005. <![CDATA[@return the state of this job]]>
  8006. </doc>
  8007. </method>
  8008. <method name="getJobClient" return="org.apache.hadoop.mapred.JobClient"
  8009. abstract="false" native="false" synchronized="false"
  8010. static="false" final="false" visibility="public"
  8011. deprecated="not deprecated">
  8012. <doc>
  8013. <![CDATA[@return the job client of this job]]>
  8014. </doc>
  8015. </method>
  8016. <method name="getDependingJobs" return="java.util.ArrayList"
  8017. abstract="false" native="false" synchronized="false"
  8018. static="false" final="false" visibility="public"
  8019. deprecated="not deprecated">
  8020. <doc>
  8021. <![CDATA[@return the depending jobs of this job]]>
  8022. </doc>
  8023. </method>
  8024. <field name="SUCCESS" type="int"
  8025. transient="false" volatile="false"
  8026. static="true" final="true" visibility="public"
  8027. deprecated="not deprecated">
  8028. </field>
  8029. <field name="WAITING" type="int"
  8030. transient="false" volatile="false"
  8031. static="true" final="true" visibility="public"
  8032. deprecated="not deprecated">
  8033. </field>
  8034. <field name="RUNNING" type="int"
  8035. transient="false" volatile="false"
  8036. static="true" final="true" visibility="public"
  8037. deprecated="not deprecated">
  8038. </field>
  8039. <field name="READY" type="int"
  8040. transient="false" volatile="false"
  8041. static="true" final="true" visibility="public"
  8042. deprecated="not deprecated">
  8043. </field>
  8044. <field name="FAILED" type="int"
  8045. transient="false" volatile="false"
  8046. static="true" final="true" visibility="public"
  8047. deprecated="not deprecated">
  8048. </field>
  8049. <field name="DEPENDENT_FAILED" type="int"
  8050. transient="false" volatile="false"
  8051. static="true" final="true" visibility="public"
  8052. deprecated="not deprecated">
  8053. </field>
  8054. <doc>
  8055. <![CDATA[@deprecated Use {@link ControlledJob} instead.]]>
  8056. </doc>
  8057. </class>
  8058. <!-- end class org.apache.hadoop.mapred.jobcontrol.Job -->
  8059. <!-- start class org.apache.hadoop.mapred.jobcontrol.JobControl -->
  8060. <class name="JobControl" extends="org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl"
  8061. abstract="false"
  8062. static="false" final="false" visibility="public"
  8063. deprecated="Use
  8064. {@link org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl} instead">
  8065. <constructor name="JobControl" type="java.lang.String"
  8066. static="false" final="false" visibility="public"
  8067. deprecated="not deprecated">
  8068. <doc>
  8069. <![CDATA[Construct a job control for a group of jobs.
  8070. @param groupName a name identifying this group]]>
  8071. </doc>
  8072. </constructor>
  8073. <method name="getWaitingJobs" return="java.util.ArrayList"
  8074. abstract="false" native="false" synchronized="false"
  8075. static="false" final="false" visibility="public"
  8076. deprecated="not deprecated">
  8077. <doc>
  8078. <![CDATA[@return the jobs in the waiting state]]>
  8079. </doc>
  8080. </method>
  8081. <method name="getRunningJobs" return="java.util.ArrayList"
  8082. abstract="false" native="false" synchronized="false"
  8083. static="false" final="false" visibility="public"
  8084. deprecated="not deprecated">
  8085. <doc>
  8086. <![CDATA[@return the jobs in the running state]]>
  8087. </doc>
  8088. </method>
  8089. <method name="getReadyJobs" return="java.util.ArrayList"
  8090. abstract="false" native="false" synchronized="false"
  8091. static="false" final="false" visibility="public"
  8092. deprecated="not deprecated">
  8093. <doc>
  8094. <![CDATA[@return the jobs in the ready state]]>
  8095. </doc>
  8096. </method>
  8097. <method name="getSuccessfulJobs" return="java.util.ArrayList"
  8098. abstract="false" native="false" synchronized="false"
  8099. static="false" final="false" visibility="public"
  8100. deprecated="not deprecated">
  8101. <doc>
  8102. <![CDATA[@return the jobs in the success state]]>
  8103. </doc>
  8104. </method>
  8105. <method name="getFailedJobs" return="java.util.ArrayList"
  8106. abstract="false" native="false" synchronized="false"
  8107. static="false" final="false" visibility="public"
  8108. deprecated="not deprecated">
  8109. </method>
  8110. <method name="addJobs"
  8111. abstract="false" native="false" synchronized="false"
  8112. static="false" final="false" visibility="public"
  8113. deprecated="not deprecated">
  8114. <param name="jobs" type="java.util.Collection"/>
  8115. <doc>
  8116. <![CDATA[Add a collection of jobs
  8117. @param jobs]]>
  8118. </doc>
  8119. </method>
  8120. <method name="getState" return="int"
  8121. abstract="false" native="false" synchronized="false"
  8122. static="false" final="false" visibility="public"
  8123. deprecated="not deprecated">
  8124. <doc>
  8125. <![CDATA[@return the thread state]]>
  8126. </doc>
  8127. </method>
  8128. <doc>
  8129. <![CDATA[@deprecated Use
  8130. {@link org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl} instead]]>
  8131. </doc>
  8132. </class>
  8133. <!-- end class org.apache.hadoop.mapred.jobcontrol.JobControl -->
  8134. </package>
  8135. <package name="org.apache.hadoop.mapred.join">
  8136. <!-- start class org.apache.hadoop.mapred.join.ArrayListBackedIterator -->
  8137. <class name="ArrayListBackedIterator" extends="org.apache.hadoop.mapreduce.lib.join.ArrayListBackedIterator"
  8138. abstract="false"
  8139. static="false" final="false" visibility="public"
  8140. deprecated="Use
  8141. {@link org.apache.hadoop.mapreduce.lib.join.ArrayListBackedIterator} instead">
  8142. <implements name="org.apache.hadoop.mapred.join.ResetableIterator"/>
  8143. <constructor name="ArrayListBackedIterator"
  8144. static="false" final="false" visibility="public"
  8145. deprecated="not deprecated">
  8146. </constructor>
  8147. <constructor name="ArrayListBackedIterator" type="java.util.ArrayList"
  8148. static="false" final="false" visibility="public"
  8149. deprecated="not deprecated">
  8150. </constructor>
  8151. <doc>
  8152. <![CDATA[This class provides an implementation of ResetableIterator. The
  8153. implementation uses an {@link java.util.ArrayList} to store elements
  8154. added to it, replaying them as requested.
  8155. Prefer {@link StreamBackedIterator}.
  8156. @deprecated Use
  8157. {@link org.apache.hadoop.mapreduce.lib.join.ArrayListBackedIterator} instead]]>
  8158. </doc>
  8159. </class>
  8160. <!-- end class org.apache.hadoop.mapred.join.ArrayListBackedIterator -->
  8161. <!-- start interface org.apache.hadoop.mapred.join.ComposableInputFormat -->
  8162. <interface name="ComposableInputFormat" abstract="true"
  8163. static="false" final="false" visibility="public"
  8164. deprecated="Use
  8165. {@link org.apache.hadoop.mapreduce.lib.join.ComposableInputFormat} instead">
  8166. <implements name="org.apache.hadoop.mapred.InputFormat"/>
  8167. <method name="getRecordReader" return="org.apache.hadoop.mapred.join.ComposableRecordReader"
  8168. abstract="false" native="false" synchronized="false"
  8169. static="false" final="false" visibility="public"
  8170. deprecated="not deprecated">
  8171. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  8172. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  8173. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  8174. <exception name="IOException" type="java.io.IOException"/>
  8175. </method>
  8176. <doc>
  8177. <![CDATA[Refinement of InputFormat requiring implementors to provide
  8178. ComposableRecordReader instead of RecordReader.
  8179. @deprecated Use
  8180. {@link org.apache.hadoop.mapreduce.lib.join.ComposableInputFormat} instead]]>
  8181. </doc>
  8182. </interface>
  8183. <!-- end interface org.apache.hadoop.mapred.join.ComposableInputFormat -->
  8184. <!-- start interface org.apache.hadoop.mapred.join.ComposableRecordReader -->
  8185. <interface name="ComposableRecordReader" abstract="true"
  8186. static="false" final="false" visibility="public"
  8187. deprecated="Use
  8188. {@link org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader} instead">
  8189. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  8190. <implements name="java.lang.Comparable"/>
  8191. <method name="id" return="int"
  8192. abstract="false" native="false" synchronized="false"
  8193. static="false" final="false" visibility="public"
  8194. deprecated="not deprecated">
  8195. <doc>
  8196. <![CDATA[Return the position in the collector this class occupies.]]>
  8197. </doc>
  8198. </method>
  8199. <method name="key" return="K"
  8200. abstract="false" native="false" synchronized="false"
  8201. static="false" final="false" visibility="public"
  8202. deprecated="not deprecated">
  8203. <doc>
  8204. <![CDATA[Return the key this RecordReader would supply on a call to next(K,V)]]>
  8205. </doc>
  8206. </method>
  8207. <method name="key"
  8208. abstract="false" native="false" synchronized="false"
  8209. static="false" final="false" visibility="public"
  8210. deprecated="not deprecated">
  8211. <param name="key" type="K"/>
  8212. <exception name="IOException" type="java.io.IOException"/>
  8213. <doc>
  8214. <![CDATA[Clone the key at the head of this RecordReader into the object provided.]]>
  8215. </doc>
  8216. </method>
  8217. <method name="hasNext" return="boolean"
  8218. abstract="false" native="false" synchronized="false"
  8219. static="false" final="false" visibility="public"
  8220. deprecated="not deprecated">
  8221. <doc>
  8222. <![CDATA[Returns true if the stream is not empty, but provides no guarantee that
  8223. a call to next(K,V) will succeed.]]>
  8224. </doc>
  8225. </method>
  8226. <method name="skip"
  8227. abstract="false" native="false" synchronized="false"
  8228. static="false" final="false" visibility="public"
  8229. deprecated="not deprecated">
  8230. <param name="key" type="K"/>
  8231. <exception name="IOException" type="java.io.IOException"/>
  8232. <doc>
  8233. <![CDATA[Skip key-value pairs with keys less than or equal to the key provided.]]>
  8234. </doc>
  8235. </method>
  8236. <method name="accept"
  8237. abstract="false" native="false" synchronized="false"
  8238. static="false" final="false" visibility="public"
  8239. deprecated="not deprecated">
  8240. <param name="jc" type="org.apache.hadoop.mapred.join.CompositeRecordReader.JoinCollector"/>
  8241. <param name="key" type="K"/>
  8242. <exception name="IOException" type="java.io.IOException"/>
  8243. <doc>
  8244. <![CDATA[While key-value pairs from this RecordReader match the given key, register
  8245. them with the JoinCollector provided.]]>
  8246. </doc>
  8247. </method>
  8248. <doc>
  8249. <![CDATA[Additional operations required of a RecordReader to participate in a join.
  8250. @deprecated Use
  8251. {@link org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader} instead]]>
  8252. </doc>
  8253. </interface>
  8254. <!-- end interface org.apache.hadoop.mapred.join.ComposableRecordReader -->
  8255. <!-- start class org.apache.hadoop.mapred.join.CompositeInputFormat -->
  8256. <class name="CompositeInputFormat" extends="java.lang.Object"
  8257. abstract="false"
  8258. static="false" final="false" visibility="public"
  8259. deprecated="Use
  8260. {@link org.apache.hadoop.mapreduce.lib.join.CompositeInputFormat} instead">
  8261. <implements name="org.apache.hadoop.mapred.join.ComposableInputFormat"/>
  8262. <constructor name="CompositeInputFormat"
  8263. static="false" final="false" visibility="public"
  8264. deprecated="not deprecated">
  8265. </constructor>
  8266. <method name="setFormat"
  8267. abstract="false" native="false" synchronized="false"
  8268. static="false" final="false" visibility="public"
  8269. deprecated="not deprecated">
  8270. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  8271. <exception name="IOException" type="java.io.IOException"/>
  8272. <doc>
  8273. <![CDATA[Interpret a given string as a composite expression.
  8274. {@code
  8275. func ::= <ident>([<func>,]*<func>)
  8276. func ::= tbl(<class>,"<path>")
  8277. class ::= @see java.lang.Class#forName(java.lang.String)
  8278. path ::= @see org.apache.hadoop.fs.Path#Path(java.lang.String)
  8279. }
  8280. Reads expression from the <tt>mapred.join.expr</tt> property and
  8281. user-supplied join types from <tt>mapred.join.define.&lt;ident&gt;</tt>
  8282. types. Paths supplied to <tt>tbl</tt> are given as input paths to the
  8283. InputFormat class listed.
  8284. @see #compose(java.lang.String, java.lang.Class, java.lang.String...)]]>
  8285. </doc>
  8286. </method>
  8287. <method name="addDefaults"
  8288. abstract="false" native="false" synchronized="false"
  8289. static="false" final="false" visibility="protected"
  8290. deprecated="not deprecated">
  8291. <doc>
  8292. <![CDATA[Adds the default set of identifiers to the parser.]]>
  8293. </doc>
  8294. </method>
  8295. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  8296. abstract="false" native="false" synchronized="false"
  8297. static="false" final="false" visibility="public"
  8298. deprecated="not deprecated">
  8299. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  8300. <param name="numSplits" type="int"/>
  8301. <exception name="IOException" type="java.io.IOException"/>
  8302. <doc>
  8303. <![CDATA[Build a CompositeInputSplit from the child InputFormats by assigning the
  8304. ith split from each child to the ith composite split.]]>
  8305. </doc>
  8306. </method>
  8307. <method name="getRecordReader" return="org.apache.hadoop.mapred.join.ComposableRecordReader"
  8308. abstract="false" native="false" synchronized="false"
  8309. static="false" final="false" visibility="public"
  8310. deprecated="not deprecated">
  8311. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  8312. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  8313. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  8314. <exception name="IOException" type="java.io.IOException"/>
  8315. <doc>
  8316. <![CDATA[Construct a CompositeRecordReader for the children of this InputFormat
  8317. as defined in the init expression.
  8318. The outermost join need only be composable, not necessarily a composite.
  8319. Mandating TupleWritable isn't strictly correct.]]>
  8320. </doc>
  8321. </method>
  8322. <method name="compose" return="java.lang.String"
  8323. abstract="false" native="false" synchronized="false"
  8324. static="true" final="false" visibility="public"
  8325. deprecated="not deprecated">
  8326. <param name="inf" type="java.lang.Class"/>
  8327. <param name="path" type="java.lang.String"/>
  8328. <doc>
  8329. <![CDATA[Convenience method for constructing composite formats.
  8330. Given InputFormat class (inf), path (p) return:
  8331. {@code tbl(<inf>, <p>) }]]>
  8332. </doc>
  8333. </method>
  8334. <method name="compose" return="java.lang.String"
  8335. abstract="false" native="false" synchronized="false"
  8336. static="true" final="false" visibility="public"
  8337. deprecated="not deprecated">
  8338. <param name="op" type="java.lang.String"/>
  8339. <param name="inf" type="java.lang.Class"/>
  8340. <param name="path" type="java.lang.String[]"/>
  8341. <doc>
  8342. <![CDATA[Convenience method for constructing composite formats.
  8343. Given operation (op), Object class (inf), set of paths (p) return:
  8344. {@code <op>(tbl(<inf>,<p1>),tbl(<inf>,<p2>),...,tbl(<inf>,<pn>)) }]]>
  8345. </doc>
  8346. </method>
  8347. <method name="compose" return="java.lang.String"
  8348. abstract="false" native="false" synchronized="false"
  8349. static="true" final="false" visibility="public"
  8350. deprecated="not deprecated">
  8351. <param name="op" type="java.lang.String"/>
  8352. <param name="inf" type="java.lang.Class"/>
  8353. <param name="path" type="org.apache.hadoop.fs.Path[]"/>
  8354. <doc>
  8355. <![CDATA[Convenience method for constructing composite formats.
  8356. Given operation (op), Object class (inf), set of paths (p) return:
  8357. {@code <op>(tbl(<inf>,<p1>),tbl(<inf>,<p2>),...,tbl(<inf>,<pn>)) }]]>
  8358. </doc>
  8359. </method>
  8360. <doc>
  8361. <![CDATA[An InputFormat capable of performing joins over a set of data sources sorted
  8362. and partitioned the same way.
  8363. @see #setFormat
  8364. A user may define new join types by setting the property
  8365. <tt>mapred.join.define.&lt;ident&gt;</tt> to a classname. In the expression
  8366. <tt>mapred.join.expr</tt>, the identifier will be assumed to be a
  8367. ComposableRecordReader.
  8368. <tt>mapred.join.keycomparator</tt> can be a classname used to compare keys
  8369. in the join.
  8370. @see JoinRecordReader
  8371. @see MultiFilterRecordReader
  8372. @deprecated Use
  8373. {@link org.apache.hadoop.mapreduce.lib.join.CompositeInputFormat} instead]]>
  8374. </doc>
  8375. </class>
  8376. <!-- end class org.apache.hadoop.mapred.join.CompositeInputFormat -->
  8377. <!-- start class org.apache.hadoop.mapred.join.CompositeInputSplit -->
  8378. <class name="CompositeInputSplit" extends="java.lang.Object"
  8379. abstract="false"
  8380. static="false" final="false" visibility="public"
  8381. deprecated="Use
  8382. {@link org.apache.hadoop.mapreduce.lib.join.CompositeInputSplit} instead">
  8383. <implements name="org.apache.hadoop.mapred.InputSplit"/>
  8384. <constructor name="CompositeInputSplit"
  8385. static="false" final="false" visibility="public"
  8386. deprecated="not deprecated">
  8387. </constructor>
  8388. <constructor name="CompositeInputSplit" type="int"
  8389. static="false" final="false" visibility="public"
  8390. deprecated="not deprecated">
  8391. </constructor>
  8392. <method name="add"
  8393. abstract="false" native="false" synchronized="false"
  8394. static="false" final="false" visibility="public"
  8395. deprecated="not deprecated">
  8396. <param name="s" type="org.apache.hadoop.mapred.InputSplit"/>
  8397. <exception name="IOException" type="java.io.IOException"/>
  8398. <doc>
  8399. <![CDATA[Add an InputSplit to this collection.
  8400. @throws IOException If capacity was not specified during construction
  8401. or if capacity has been reached.]]>
  8402. </doc>
  8403. </method>
  8404. <method name="get" return="org.apache.hadoop.mapred.InputSplit"
  8405. abstract="false" native="false" synchronized="false"
  8406. static="false" final="false" visibility="public"
  8407. deprecated="not deprecated">
  8408. <param name="i" type="int"/>
  8409. <doc>
  8410. <![CDATA[Get ith child InputSplit.]]>
  8411. </doc>
  8412. </method>
  8413. <method name="getLength" return="long"
  8414. abstract="false" native="false" synchronized="false"
  8415. static="false" final="false" visibility="public"
  8416. deprecated="not deprecated">
  8417. <exception name="IOException" type="java.io.IOException"/>
  8418. <doc>
  8419. <![CDATA[Return the aggregate length of all child InputSplits currently added.]]>
  8420. </doc>
  8421. </method>
  8422. <method name="getLength" return="long"
  8423. abstract="false" native="false" synchronized="false"
  8424. static="false" final="false" visibility="public"
  8425. deprecated="not deprecated">
  8426. <param name="i" type="int"/>
  8427. <exception name="IOException" type="java.io.IOException"/>
  8428. <doc>
  8429. <![CDATA[Get the length of ith child InputSplit.]]>
  8430. </doc>
  8431. </method>
  8432. <method name="getLocations" return="java.lang.String[]"
  8433. abstract="false" native="false" synchronized="false"
  8434. static="false" final="false" visibility="public"
  8435. deprecated="not deprecated">
  8436. <exception name="IOException" type="java.io.IOException"/>
  8437. <doc>
  8438. <![CDATA[Collect a set of hosts from all child InputSplits.]]>
  8439. </doc>
  8440. </method>
  8441. <method name="getLocation" return="java.lang.String[]"
  8442. abstract="false" native="false" synchronized="false"
  8443. static="false" final="false" visibility="public"
  8444. deprecated="not deprecated">
  8445. <param name="i" type="int"/>
  8446. <exception name="IOException" type="java.io.IOException"/>
  8447. <doc>
  8448. <![CDATA[getLocations from ith InputSplit.]]>
  8449. </doc>
  8450. </method>
  8451. <method name="write"
  8452. abstract="false" native="false" synchronized="false"
  8453. static="false" final="false" visibility="public"
  8454. deprecated="not deprecated">
  8455. <param name="out" type="java.io.DataOutput"/>
  8456. <exception name="IOException" type="java.io.IOException"/>
  8457. <doc>
  8458. <![CDATA[Write splits in the following format.
  8459. {@code
  8460. <count><class1><class2>...<classn><split1><split2>...<splitn>
  8461. }]]>
  8462. </doc>
  8463. </method>
  8464. <method name="readFields"
  8465. abstract="false" native="false" synchronized="false"
  8466. static="false" final="false" visibility="public"
  8467. deprecated="not deprecated">
  8468. <param name="in" type="java.io.DataInput"/>
  8469. <exception name="IOException" type="java.io.IOException"/>
  8470. <doc>
  8471. <![CDATA[{@inheritDoc}
  8472. @throws IOException If the child InputSplit cannot be read, typically
  8473. for failing access checks.]]>
  8474. </doc>
  8475. </method>
  8476. <doc>
  8477. <![CDATA[This InputSplit contains a set of child InputSplits. Any InputSplit inserted
  8478. into this collection must have a public default constructor.
  8479. @deprecated Use
  8480. {@link org.apache.hadoop.mapreduce.lib.join.CompositeInputSplit} instead]]>
  8481. </doc>
  8482. </class>
  8483. <!-- end class org.apache.hadoop.mapred.join.CompositeInputSplit -->
  8484. <!-- start class org.apache.hadoop.mapred.join.CompositeRecordReader -->
  8485. <class name="CompositeRecordReader" extends="java.lang.Object"
  8486. abstract="true"
  8487. static="false" final="false" visibility="public"
  8488. deprecated="Use
  8489. {@link org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader} instead">
  8490. <implements name="org.apache.hadoop.conf.Configurable"/>
  8491. <constructor name="CompositeRecordReader" type="int, int, java.lang.Class"
  8492. static="false" final="false" visibility="public"
  8493. deprecated="not deprecated">
  8494. <exception name="IOException" type="java.io.IOException"/>
  8495. <doc>
  8496. <![CDATA[Create a RecordReader with <tt>capacity</tt> children to position
  8497. <tt>id</tt> in the parent reader.
  8498. The id of a root CompositeRecordReader is -1 by convention, but relying
  8499. on this is not recommended.]]>
  8500. </doc>
  8501. </constructor>
  8502. <method name="combine" return="boolean"
  8503. abstract="true" native="false" synchronized="false"
  8504. static="false" final="false" visibility="protected"
  8505. deprecated="not deprecated">
  8506. <param name="srcs" type="java.lang.Object[]"/>
  8507. <param name="value" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8508. </method>
  8509. <method name="id" return="int"
  8510. abstract="false" native="false" synchronized="false"
  8511. static="false" final="false" visibility="public"
  8512. deprecated="not deprecated">
  8513. <doc>
  8514. <![CDATA[Return the position in the collector this class occupies.]]>
  8515. </doc>
  8516. </method>
  8517. <method name="setConf"
  8518. abstract="false" native="false" synchronized="false"
  8519. static="false" final="false" visibility="public"
  8520. deprecated="not deprecated">
  8521. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  8522. <doc>
  8523. <![CDATA[{@inheritDoc}]]>
  8524. </doc>
  8525. </method>
  8526. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  8527. abstract="false" native="false" synchronized="false"
  8528. static="false" final="false" visibility="public"
  8529. deprecated="not deprecated">
  8530. <doc>
  8531. <![CDATA[{@inheritDoc}]]>
  8532. </doc>
  8533. </method>
  8534. <method name="getRecordReaderQueue" return="java.util.PriorityQueue"
  8535. abstract="false" native="false" synchronized="false"
  8536. static="false" final="false" visibility="protected"
  8537. deprecated="not deprecated">
  8538. <doc>
  8539. <![CDATA[Return sorted list of RecordReaders for this composite.]]>
  8540. </doc>
  8541. </method>
  8542. <method name="getComparator" return="org.apache.hadoop.io.WritableComparator"
  8543. abstract="false" native="false" synchronized="false"
  8544. static="false" final="false" visibility="protected"
  8545. deprecated="not deprecated">
  8546. <doc>
  8547. <![CDATA[Return comparator defining the ordering for RecordReaders in this
  8548. composite.]]>
  8549. </doc>
  8550. </method>
  8551. <method name="add"
  8552. abstract="false" native="false" synchronized="false"
  8553. static="false" final="false" visibility="public"
  8554. deprecated="not deprecated">
  8555. <param name="rr" type="org.apache.hadoop.mapred.join.ComposableRecordReader"/>
  8556. <exception name="IOException" type="java.io.IOException"/>
  8557. <doc>
  8558. <![CDATA[Add a RecordReader to this collection.
  8559. The id() of a RecordReader determines where in the Tuple its
  8560. entry will appear. Adding RecordReaders with the same id has
  8561. undefined behavior.]]>
  8562. </doc>
  8563. </method>
  8564. <method name="key" return="K"
  8565. abstract="false" native="false" synchronized="false"
  8566. static="false" final="false" visibility="public"
  8567. deprecated="not deprecated">
  8568. <doc>
  8569. <![CDATA[Return the key for the current join or the value at the top of the
  8570. RecordReader heap.]]>
  8571. </doc>
  8572. </method>
  8573. <method name="key"
  8574. abstract="false" native="false" synchronized="false"
  8575. static="false" final="false" visibility="public"
  8576. deprecated="not deprecated">
  8577. <param name="key" type="K"/>
  8578. <exception name="IOException" type="java.io.IOException"/>
  8579. <doc>
  8580. <![CDATA[Clone the key at the top of this RR into the given object.]]>
  8581. </doc>
  8582. </method>
  8583. <method name="hasNext" return="boolean"
  8584. abstract="false" native="false" synchronized="false"
  8585. static="false" final="false" visibility="public"
  8586. deprecated="not deprecated">
  8587. <doc>
  8588. <![CDATA[Return true if it is possible that this could emit more values.]]>
  8589. </doc>
  8590. </method>
  8591. <method name="skip"
  8592. abstract="false" native="false" synchronized="false"
  8593. static="false" final="false" visibility="public"
  8594. deprecated="not deprecated">
  8595. <param name="key" type="K"/>
  8596. <exception name="IOException" type="java.io.IOException"/>
  8597. <doc>
  8598. <![CDATA[Pass skip key to child RRs.]]>
  8599. </doc>
  8600. </method>
  8601. <method name="getDelegate" return="org.apache.hadoop.mapred.join.ResetableIterator"
  8602. abstract="true" native="false" synchronized="false"
  8603. static="false" final="false" visibility="protected"
  8604. deprecated="not deprecated">
  8605. <doc>
  8606. <![CDATA[Obtain an iterator over the child RRs apropos of the value type
  8607. ultimately emitted from this join.]]>
  8608. </doc>
  8609. </method>
  8610. <method name="accept"
  8611. abstract="false" native="false" synchronized="false"
  8612. static="false" final="false" visibility="public"
  8613. deprecated="not deprecated">
  8614. <param name="jc" type="org.apache.hadoop.mapred.join.CompositeRecordReader.JoinCollector"/>
  8615. <param name="key" type="K"/>
  8616. <exception name="IOException" type="java.io.IOException"/>
  8617. <doc>
  8618. <![CDATA[If key provided matches that of this Composite, give JoinCollector
  8619. iterator over values it may emit.]]>
  8620. </doc>
  8621. </method>
  8622. <method name="fillJoinCollector"
  8623. abstract="false" native="false" synchronized="false"
  8624. static="false" final="false" visibility="protected"
  8625. deprecated="not deprecated">
  8626. <param name="iterkey" type="K"/>
  8627. <exception name="IOException" type="java.io.IOException"/>
  8628. <doc>
  8629. <![CDATA[For all child RRs offering the key provided, obtain an iterator
  8630. at that position in the JoinCollector.]]>
  8631. </doc>
  8632. </method>
  8633. <method name="compareTo" return="int"
  8634. abstract="false" native="false" synchronized="false"
  8635. static="false" final="false" visibility="public"
  8636. deprecated="not deprecated">
  8637. <param name="other" type="org.apache.hadoop.mapred.join.ComposableRecordReader"/>
  8638. <doc>
  8639. <![CDATA[Implement Comparable contract (compare key of join or head of heap
  8640. with that of another).]]>
  8641. </doc>
  8642. </method>
  8643. <method name="createKey" return="K"
  8644. abstract="false" native="false" synchronized="false"
  8645. static="false" final="false" visibility="public"
  8646. deprecated="not deprecated">
  8647. <doc>
  8648. <![CDATA[Create a new key value common to all child RRs.
  8649. @throws ClassCastException if key classes differ.]]>
  8650. </doc>
  8651. </method>
  8652. <method name="createInternalValue" return="org.apache.hadoop.mapred.join.TupleWritable"
  8653. abstract="false" native="false" synchronized="false"
  8654. static="false" final="false" visibility="protected"
  8655. deprecated="not deprecated">
  8656. <doc>
  8657. <![CDATA[Create a value to be used internally for joins.]]>
  8658. </doc>
  8659. </method>
  8660. <method name="getPos" return="long"
  8661. abstract="false" native="false" synchronized="false"
  8662. static="false" final="false" visibility="public"
  8663. deprecated="not deprecated">
  8664. <exception name="IOException" type="java.io.IOException"/>
  8665. <doc>
  8666. <![CDATA[Unsupported (returns zero in all cases).]]>
  8667. </doc>
  8668. </method>
  8669. <method name="close"
  8670. abstract="false" native="false" synchronized="false"
  8671. static="false" final="false" visibility="public"
  8672. deprecated="not deprecated">
  8673. <exception name="IOException" type="java.io.IOException"/>
  8674. <doc>
  8675. <![CDATA[Close all child RRs.]]>
  8676. </doc>
  8677. </method>
  8678. <method name="getProgress" return="float"
  8679. abstract="false" native="false" synchronized="false"
  8680. static="false" final="false" visibility="public"
  8681. deprecated="not deprecated">
  8682. <exception name="IOException" type="java.io.IOException"/>
  8683. <doc>
  8684. <![CDATA[Report progress as the minimum of all child RR progress.]]>
  8685. </doc>
  8686. </method>
  8687. <field name="jc" type="org.apache.hadoop.mapred.join.CompositeRecordReader.JoinCollector"
  8688. transient="false" volatile="false"
  8689. static="false" final="true" visibility="protected"
  8690. deprecated="not deprecated">
  8691. </field>
  8692. <field name="kids" type="org.apache.hadoop.mapred.join.ComposableRecordReader[]"
  8693. transient="false" volatile="false"
  8694. static="false" final="true" visibility="protected"
  8695. deprecated="not deprecated">
  8696. </field>
  8697. <doc>
  8698. <![CDATA[A RecordReader that can effect joins of RecordReaders sharing a common key
  8699. type and partitioning.
  8700. @deprecated Use
  8701. {@link org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader} instead]]>
  8702. </doc>
  8703. </class>
  8704. <!-- end class org.apache.hadoop.mapred.join.CompositeRecordReader -->
  8705. <!-- start class org.apache.hadoop.mapred.join.InnerJoinRecordReader -->
  8706. <class name="InnerJoinRecordReader" extends="org.apache.hadoop.mapred.join.JoinRecordReader"
  8707. abstract="false"
  8708. static="false" final="false" visibility="public"
  8709. deprecated="Use
  8710. {@link org.apache.hadoop.mapreduce.lib.join.InnerJoinRecordReader} instead.">
  8711. <method name="combine" return="boolean"
  8712. abstract="false" native="false" synchronized="false"
  8713. static="false" final="false" visibility="protected"
  8714. deprecated="not deprecated">
  8715. <param name="srcs" type="java.lang.Object[]"/>
  8716. <param name="dst" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8717. <doc>
  8718. <![CDATA[Return true iff the tuple is full (all data sources contain this key).]]>
  8719. </doc>
  8720. </method>
  8721. <doc>
  8722. <![CDATA[Full inner join.
  8723. @deprecated Use
  8724. {@link org.apache.hadoop.mapreduce.lib.join.InnerJoinRecordReader} instead.]]>
  8725. </doc>
  8726. </class>
  8727. <!-- end class org.apache.hadoop.mapred.join.InnerJoinRecordReader -->
  8728. <!-- start class org.apache.hadoop.mapred.join.JoinRecordReader -->
  8729. <class name="JoinRecordReader" extends="org.apache.hadoop.mapred.join.CompositeRecordReader"
  8730. abstract="true"
  8731. static="false" final="false" visibility="public"
  8732. deprecated="Use
  8733. {@link org.apache.hadoop.mapreduce.lib.join.JoinRecordReader} instead">
  8734. <implements name="org.apache.hadoop.mapred.join.ComposableRecordReader"/>
  8735. <constructor name="JoinRecordReader" type="int, org.apache.hadoop.mapred.JobConf, int, java.lang.Class"
  8736. static="false" final="false" visibility="public"
  8737. deprecated="not deprecated">
  8738. <exception name="IOException" type="java.io.IOException"/>
  8739. </constructor>
  8740. <method name="next" return="boolean"
  8741. abstract="false" native="false" synchronized="false"
  8742. static="false" final="false" visibility="public"
  8743. deprecated="not deprecated">
  8744. <param name="key" type="K"/>
  8745. <param name="value" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8746. <exception name="IOException" type="java.io.IOException"/>
  8747. <doc>
  8748. <![CDATA[Emit the next set of key, value pairs as defined by the child
  8749. RecordReaders and operation associated with this composite RR.]]>
  8750. </doc>
  8751. </method>
  8752. <method name="createValue" return="org.apache.hadoop.mapred.join.TupleWritable"
  8753. abstract="false" native="false" synchronized="false"
  8754. static="false" final="false" visibility="public"
  8755. deprecated="not deprecated">
  8756. <doc>
  8757. <![CDATA[{@inheritDoc}]]>
  8758. </doc>
  8759. </method>
  8760. <method name="getDelegate" return="org.apache.hadoop.mapred.join.ResetableIterator"
  8761. abstract="false" native="false" synchronized="false"
  8762. static="false" final="false" visibility="protected"
  8763. deprecated="not deprecated">
  8764. <doc>
  8765. <![CDATA[Return an iterator wrapping the JoinCollector.]]>
  8766. </doc>
  8767. </method>
  8768. <doc>
  8769. <![CDATA[Base class for Composite joins returning Tuples of arbitrary Writables.
  8770. @deprecated Use
  8771. {@link org.apache.hadoop.mapreduce.lib.join.JoinRecordReader} instead]]>
  8772. </doc>
  8773. </class>
  8774. <!-- end class org.apache.hadoop.mapred.join.JoinRecordReader -->
  8775. <!-- start class org.apache.hadoop.mapred.join.JoinRecordReader.JoinDelegationIterator -->
  8776. <class name="JoinRecordReader.JoinDelegationIterator" extends="java.lang.Object"
  8777. abstract="false"
  8778. static="false" final="false" visibility="protected"
  8779. deprecated="not deprecated">
  8780. <implements name="org.apache.hadoop.mapred.join.ResetableIterator"/>
  8781. <constructor name="JoinRecordReader.JoinDelegationIterator"
  8782. static="false" final="false" visibility="protected"
  8783. deprecated="not deprecated">
  8784. </constructor>
  8785. <method name="hasNext" return="boolean"
  8786. abstract="false" native="false" synchronized="false"
  8787. static="false" final="false" visibility="public"
  8788. deprecated="not deprecated">
  8789. </method>
  8790. <method name="next" return="boolean"
  8791. abstract="false" native="false" synchronized="false"
  8792. static="false" final="false" visibility="public"
  8793. deprecated="not deprecated">
  8794. <param name="val" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8795. <exception name="IOException" type="java.io.IOException"/>
  8796. </method>
  8797. <method name="replay" return="boolean"
  8798. abstract="false" native="false" synchronized="false"
  8799. static="false" final="false" visibility="public"
  8800. deprecated="not deprecated">
  8801. <param name="val" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8802. <exception name="IOException" type="java.io.IOException"/>
  8803. </method>
  8804. <method name="reset"
  8805. abstract="false" native="false" synchronized="false"
  8806. static="false" final="false" visibility="public"
  8807. deprecated="not deprecated">
  8808. </method>
  8809. <method name="add"
  8810. abstract="false" native="false" synchronized="false"
  8811. static="false" final="false" visibility="public"
  8812. deprecated="not deprecated">
  8813. <param name="item" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8814. <exception name="IOException" type="java.io.IOException"/>
  8815. </method>
  8816. <method name="close"
  8817. abstract="false" native="false" synchronized="false"
  8818. static="false" final="false" visibility="public"
  8819. deprecated="not deprecated">
  8820. <exception name="IOException" type="java.io.IOException"/>
  8821. </method>
  8822. <method name="clear"
  8823. abstract="false" native="false" synchronized="false"
  8824. static="false" final="false" visibility="public"
  8825. deprecated="not deprecated">
  8826. </method>
  8827. <doc>
  8828. <![CDATA[Since the JoinCollector is effecting our operation, we need only
  8829. provide an iterator proxy wrapping its operation.]]>
  8830. </doc>
  8831. </class>
  8832. <!-- end class org.apache.hadoop.mapred.join.JoinRecordReader.JoinDelegationIterator -->
  8833. <!-- start class org.apache.hadoop.mapred.join.MultiFilterRecordReader -->
  8834. <class name="MultiFilterRecordReader" extends="org.apache.hadoop.mapred.join.CompositeRecordReader"
  8835. abstract="true"
  8836. static="false" final="false" visibility="public"
  8837. deprecated="Use
  8838. {@link org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader} instead">
  8839. <implements name="org.apache.hadoop.mapred.join.ComposableRecordReader"/>
  8840. <constructor name="MultiFilterRecordReader" type="int, org.apache.hadoop.mapred.JobConf, int, java.lang.Class"
  8841. static="false" final="false" visibility="public"
  8842. deprecated="not deprecated">
  8843. <exception name="IOException" type="java.io.IOException"/>
  8844. </constructor>
  8845. <method name="emit" return="V"
  8846. abstract="true" native="false" synchronized="false"
  8847. static="false" final="false" visibility="protected"
  8848. deprecated="not deprecated">
  8849. <param name="dst" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8850. <exception name="IOException" type="java.io.IOException"/>
  8851. <doc>
  8852. <![CDATA[For each tuple emitted, return a value (typically one of the values
  8853. in the tuple).
  8854. Modifying the Writables in the tuple is permitted and unlikely to affect
  8855. join behavior in most cases, but it is not recommended. It's safer to
  8856. clone first.]]>
  8857. </doc>
  8858. </method>
  8859. <method name="combine" return="boolean"
  8860. abstract="false" native="false" synchronized="false"
  8861. static="false" final="false" visibility="protected"
  8862. deprecated="not deprecated">
  8863. <param name="srcs" type="java.lang.Object[]"/>
  8864. <param name="dst" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8865. <doc>
  8866. <![CDATA[Default implementation offers {@link #emit} every Tuple from the
  8867. collector (the outer join of child RRs).]]>
  8868. </doc>
  8869. </method>
  8870. <method name="next" return="boolean"
  8871. abstract="false" native="false" synchronized="false"
  8872. static="false" final="false" visibility="public"
  8873. deprecated="not deprecated">
  8874. <param name="key" type="K"/>
  8875. <param name="value" type="V"/>
  8876. <exception name="IOException" type="java.io.IOException"/>
  8877. <doc>
  8878. <![CDATA[{@inheritDoc}]]>
  8879. </doc>
  8880. </method>
  8881. <method name="createValue" return="V"
  8882. abstract="false" native="false" synchronized="false"
  8883. static="false" final="false" visibility="public"
  8884. deprecated="not deprecated">
  8885. <doc>
  8886. <![CDATA[{@inheritDoc}]]>
  8887. </doc>
  8888. </method>
  8889. <method name="getDelegate" return="org.apache.hadoop.mapred.join.ResetableIterator"
  8890. abstract="false" native="false" synchronized="false"
  8891. static="false" final="false" visibility="protected"
  8892. deprecated="not deprecated">
  8893. <doc>
  8894. <![CDATA[Return an iterator returning a single value from the tuple.
  8895. @see MultiFilterDelegationIterator]]>
  8896. </doc>
  8897. </method>
  8898. <doc>
  8899. <![CDATA[Base class for Composite join returning values derived from multiple
  8900. sources, but generally not tuples.
  8901. @deprecated Use
  8902. {@link org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader} instead]]>
  8903. </doc>
  8904. </class>
  8905. <!-- end class org.apache.hadoop.mapred.join.MultiFilterRecordReader -->
  8906. <!-- start class org.apache.hadoop.mapred.join.MultiFilterRecordReader.MultiFilterDelegationIterator -->
  8907. <class name="MultiFilterRecordReader.MultiFilterDelegationIterator" extends="java.lang.Object"
  8908. abstract="false"
  8909. static="false" final="false" visibility="protected"
  8910. deprecated="not deprecated">
  8911. <implements name="org.apache.hadoop.mapred.join.ResetableIterator"/>
  8912. <constructor name="MultiFilterRecordReader.MultiFilterDelegationIterator"
  8913. static="false" final="false" visibility="protected"
  8914. deprecated="not deprecated">
  8915. </constructor>
  8916. <method name="hasNext" return="boolean"
  8917. abstract="false" native="false" synchronized="false"
  8918. static="false" final="false" visibility="public"
  8919. deprecated="not deprecated">
  8920. </method>
  8921. <method name="next" return="boolean"
  8922. abstract="false" native="false" synchronized="false"
  8923. static="false" final="false" visibility="public"
  8924. deprecated="not deprecated">
  8925. <param name="val" type="V"/>
  8926. <exception name="IOException" type="java.io.IOException"/>
  8927. </method>
  8928. <method name="replay" return="boolean"
  8929. abstract="false" native="false" synchronized="false"
  8930. static="false" final="false" visibility="public"
  8931. deprecated="not deprecated">
  8932. <param name="val" type="V"/>
  8933. <exception name="IOException" type="java.io.IOException"/>
  8934. </method>
  8935. <method name="reset"
  8936. abstract="false" native="false" synchronized="false"
  8937. static="false" final="false" visibility="public"
  8938. deprecated="not deprecated">
  8939. </method>
  8940. <method name="add"
  8941. abstract="false" native="false" synchronized="false"
  8942. static="false" final="false" visibility="public"
  8943. deprecated="not deprecated">
  8944. <param name="item" type="V"/>
  8945. <exception name="IOException" type="java.io.IOException"/>
  8946. </method>
  8947. <method name="close"
  8948. abstract="false" native="false" synchronized="false"
  8949. static="false" final="false" visibility="public"
  8950. deprecated="not deprecated">
  8951. <exception name="IOException" type="java.io.IOException"/>
  8952. </method>
  8953. <method name="clear"
  8954. abstract="false" native="false" synchronized="false"
  8955. static="false" final="false" visibility="public"
  8956. deprecated="not deprecated">
  8957. </method>
  8958. <doc>
  8959. <![CDATA[Proxy the JoinCollector, but include callback to emit.]]>
  8960. </doc>
  8961. </class>
  8962. <!-- end class org.apache.hadoop.mapred.join.MultiFilterRecordReader.MultiFilterDelegationIterator -->
  8963. <!-- start class org.apache.hadoop.mapred.join.OuterJoinRecordReader -->
  8964. <class name="OuterJoinRecordReader" extends="org.apache.hadoop.mapred.join.JoinRecordReader"
  8965. abstract="false"
  8966. static="false" final="false" visibility="public"
  8967. deprecated="Use
  8968. {@link org.apache.hadoop.mapreduce.lib.join.OuterJoinRecordReader} instead">
  8969. <method name="combine" return="boolean"
  8970. abstract="false" native="false" synchronized="false"
  8971. static="false" final="false" visibility="protected"
  8972. deprecated="not deprecated">
  8973. <param name="srcs" type="java.lang.Object[]"/>
  8974. <param name="dst" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8975. <doc>
  8976. <![CDATA[Emit everything from the collector.]]>
  8977. </doc>
  8978. </method>
  8979. <doc>
  8980. <![CDATA[Full outer join.
  8981. @deprecated Use
  8982. {@link org.apache.hadoop.mapreduce.lib.join.OuterJoinRecordReader} instead]]>
  8983. </doc>
  8984. </class>
  8985. <!-- end class org.apache.hadoop.mapred.join.OuterJoinRecordReader -->
  8986. <!-- start class org.apache.hadoop.mapred.join.OverrideRecordReader -->
  8987. <class name="OverrideRecordReader" extends="org.apache.hadoop.mapred.join.MultiFilterRecordReader"
  8988. abstract="false"
  8989. static="false" final="false" visibility="public"
  8990. deprecated="Use
  8991. {@link org.apache.hadoop.mapreduce.lib.join.OverrideRecordReader} instead">
  8992. <method name="emit" return="V"
  8993. abstract="false" native="false" synchronized="false"
  8994. static="false" final="false" visibility="protected"
  8995. deprecated="not deprecated">
  8996. <param name="dst" type="org.apache.hadoop.mapred.join.TupleWritable"/>
  8997. <doc>
  8998. <![CDATA[Emit the value with the highest position in the tuple.]]>
  8999. </doc>
  9000. </method>
  9001. <method name="fillJoinCollector"
  9002. abstract="false" native="false" synchronized="false"
  9003. static="false" final="false" visibility="protected"
  9004. deprecated="not deprecated">
  9005. <param name="iterkey" type="K"/>
  9006. <exception name="IOException" type="java.io.IOException"/>
  9007. <doc>
  9008. <![CDATA[Instead of filling the JoinCollector with iterators from all
  9009. data sources, fill only the rightmost for this key.
  9010. This not only saves space by discarding the other sources, but
  9011. it also emits the number of key-value pairs in the preferred
  9012. RecordReader instead of repeating that stream n times, where
  9013. n is the cardinality of the cross product of the discarded
  9014. streams for the given key.]]>
  9015. </doc>
  9016. </method>
  9017. <doc>
  9018. <![CDATA[Prefer the &quot;rightmost&quot; data source for this key.
  9019. For example, <tt>override(S1,S2,S3)</tt> will prefer values
  9020. from S3 over S2, and values from S2 over S1 for all keys
  9021. emitted from all sources.
  9022. @deprecated Use
  9023. {@link org.apache.hadoop.mapreduce.lib.join.OverrideRecordReader} instead]]>
  9024. </doc>
  9025. </class>
  9026. <!-- end class org.apache.hadoop.mapred.join.OverrideRecordReader -->
  9027. <!-- start class org.apache.hadoop.mapred.join.Parser -->
  9028. <class name="Parser" extends="java.lang.Object"
  9029. abstract="false"
  9030. static="false" final="false" visibility="public"
  9031. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.join.Parser} instead">
  9032. <constructor name="Parser"
  9033. static="false" final="false" visibility="public"
  9034. deprecated="not deprecated">
  9035. </constructor>
  9036. <doc>
  9037. <![CDATA[Very simple shift-reduce parser for join expressions.
  9038. This should be sufficient for the user extension permitted now, but ought to
  9039. be replaced with a parser generator if more complex grammars are supported.
  9040. In particular, this &quot;shift-reduce&quot; parser has no states. Each set
  9041. of formals requires a different internal node type, which is responsible for
  9042. interpreting the list of tokens it receives. This is sufficient for the
  9043. current grammar, but it has several annoying properties that might inhibit
  9044. extension. In particular, parentheses are always function calls; an
  9045. algebraic or filter grammar would not only require a node type, but must
  9046. also work around the internals of this parser.
  9047. For most other cases, adding classes to the hierarchy- particularly by
  9048. extending JoinRecordReader and MultiFilterRecordReader- is fairly
  9049. straightforward. One need only override the relevant method(s) (usually only
  9050. {@link CompositeRecordReader#combine}) and include a property to map its
  9051. value to an identifier in the parser.
  9052. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.join.Parser} instead]]>
  9053. </doc>
  9054. </class>
  9055. <!-- end class org.apache.hadoop.mapred.join.Parser -->
  9056. <!-- start class org.apache.hadoop.mapred.join.Parser.Node -->
  9057. <class name="Parser.Node" extends="java.lang.Object"
  9058. abstract="true"
  9059. static="true" final="false" visibility="public"
  9060. deprecated="not deprecated">
  9061. <implements name="org.apache.hadoop.mapred.join.ComposableInputFormat"/>
  9062. <constructor name="Parser.Node" type="java.lang.String"
  9063. static="false" final="false" visibility="protected"
  9064. deprecated="not deprecated">
  9065. </constructor>
  9066. <method name="addIdentifier"
  9067. abstract="false" native="false" synchronized="false"
  9068. static="true" final="false" visibility="protected"
  9069. deprecated="not deprecated">
  9070. <param name="ident" type="java.lang.String"/>
  9071. <param name="mcstrSig" type="java.lang.Class[]"/>
  9072. <param name="nodetype" type="java.lang.Class"/>
  9073. <param name="cl" type="java.lang.Class"/>
  9074. <exception name="NoSuchMethodException" type="java.lang.NoSuchMethodException"/>
  9075. <doc>
  9076. <![CDATA[For a given identifier, add a mapping to the nodetype for the parse
  9077. tree and to the ComposableRecordReader to be created, including the
  9078. formals required to invoke the constructor.
  9079. The nodetype and constructor signature should be filled in from the
  9080. child node.]]>
  9081. </doc>
  9082. </method>
  9083. <method name="setID"
  9084. abstract="false" native="false" synchronized="false"
  9085. static="false" final="false" visibility="protected"
  9086. deprecated="not deprecated">
  9087. <param name="id" type="int"/>
  9088. </method>
  9089. <method name="setKeyComparator"
  9090. abstract="false" native="false" synchronized="false"
  9091. static="false" final="false" visibility="protected"
  9092. deprecated="not deprecated">
  9093. <param name="cmpcl" type="java.lang.Class"/>
  9094. </method>
  9095. <field name="rrCstrMap" type="java.util.Map"
  9096. transient="false" volatile="false"
  9097. static="true" final="true" visibility="protected"
  9098. deprecated="not deprecated">
  9099. </field>
  9100. <field name="id" type="int"
  9101. transient="false" volatile="false"
  9102. static="false" final="false" visibility="protected"
  9103. deprecated="not deprecated">
  9104. </field>
  9105. <field name="ident" type="java.lang.String"
  9106. transient="false" volatile="false"
  9107. static="false" final="false" visibility="protected"
  9108. deprecated="not deprecated">
  9109. </field>
  9110. <field name="cmpcl" type="java.lang.Class"
  9111. transient="false" volatile="false"
  9112. static="false" final="false" visibility="protected"
  9113. deprecated="not deprecated">
  9114. </field>
  9115. </class>
  9116. <!-- end class org.apache.hadoop.mapred.join.Parser.Node -->
  9117. <!-- start class org.apache.hadoop.mapred.join.Parser.NodeToken -->
  9118. <class name="Parser.NodeToken" extends="org.apache.hadoop.mapred.join.Parser.Token"
  9119. abstract="false"
  9120. static="true" final="false" visibility="public"
  9121. deprecated="not deprecated">
  9122. <method name="getNode" return="org.apache.hadoop.mapred.join.Parser.Node"
  9123. abstract="false" native="false" synchronized="false"
  9124. static="false" final="false" visibility="public"
  9125. deprecated="not deprecated">
  9126. </method>
  9127. </class>
  9128. <!-- end class org.apache.hadoop.mapred.join.Parser.NodeToken -->
  9129. <!-- start class org.apache.hadoop.mapred.join.Parser.NumToken -->
  9130. <class name="Parser.NumToken" extends="org.apache.hadoop.mapred.join.Parser.Token"
  9131. abstract="false"
  9132. static="true" final="false" visibility="public"
  9133. deprecated="not deprecated">
  9134. <constructor name="Parser.NumToken" type="double"
  9135. static="false" final="false" visibility="public"
  9136. deprecated="not deprecated">
  9137. </constructor>
  9138. <method name="getNum" return="double"
  9139. abstract="false" native="false" synchronized="false"
  9140. static="false" final="false" visibility="public"
  9141. deprecated="not deprecated">
  9142. </method>
  9143. </class>
  9144. <!-- end class org.apache.hadoop.mapred.join.Parser.NumToken -->
  9145. <!-- start class org.apache.hadoop.mapred.join.Parser.StrToken -->
  9146. <class name="Parser.StrToken" extends="org.apache.hadoop.mapred.join.Parser.Token"
  9147. abstract="false"
  9148. static="true" final="false" visibility="public"
  9149. deprecated="not deprecated">
  9150. <constructor name="Parser.StrToken" type="org.apache.hadoop.mapred.join.Parser.TType, java.lang.String"
  9151. static="false" final="false" visibility="public"
  9152. deprecated="not deprecated">
  9153. </constructor>
  9154. <method name="getStr" return="java.lang.String"
  9155. abstract="false" native="false" synchronized="false"
  9156. static="false" final="false" visibility="public"
  9157. deprecated="not deprecated">
  9158. </method>
  9159. </class>
  9160. <!-- end class org.apache.hadoop.mapred.join.Parser.StrToken -->
  9161. <!-- start class org.apache.hadoop.mapred.join.Parser.Token -->
  9162. <class name="Parser.Token" extends="java.lang.Object"
  9163. abstract="false"
  9164. static="true" final="false" visibility="public"
  9165. deprecated="not deprecated">
  9166. <method name="getType" return="org.apache.hadoop.mapred.join.Parser.TType"
  9167. abstract="false" native="false" synchronized="false"
  9168. static="false" final="false" visibility="public"
  9169. deprecated="not deprecated">
  9170. </method>
  9171. <method name="getNode" return="org.apache.hadoop.mapred.join.Parser.Node"
  9172. abstract="false" native="false" synchronized="false"
  9173. static="false" final="false" visibility="public"
  9174. deprecated="not deprecated">
  9175. <exception name="IOException" type="java.io.IOException"/>
  9176. </method>
  9177. <method name="getNum" return="double"
  9178. abstract="false" native="false" synchronized="false"
  9179. static="false" final="false" visibility="public"
  9180. deprecated="not deprecated">
  9181. <exception name="IOException" type="java.io.IOException"/>
  9182. </method>
  9183. <method name="getStr" return="java.lang.String"
  9184. abstract="false" native="false" synchronized="false"
  9185. static="false" final="false" visibility="public"
  9186. deprecated="not deprecated">
  9187. <exception name="IOException" type="java.io.IOException"/>
  9188. </method>
  9189. <doc>
  9190. <![CDATA[Tagged-union type for tokens from the join expression.
  9191. @see Parser.TType]]>
  9192. </doc>
  9193. </class>
  9194. <!-- end class org.apache.hadoop.mapred.join.Parser.Token -->
  9195. <!-- start class org.apache.hadoop.mapred.join.Parser.TType -->
  9196. <class name="Parser.TType" extends="java.lang.Enum"
  9197. abstract="false"
  9198. static="true" final="true" visibility="public"
  9199. deprecated="not deprecated">
  9200. <method name="values" return="org.apache.hadoop.mapred.join.Parser.TType[]"
  9201. abstract="false" native="false" synchronized="false"
  9202. static="true" final="false" visibility="public"
  9203. deprecated="not deprecated">
  9204. </method>
  9205. <method name="valueOf" return="org.apache.hadoop.mapred.join.Parser.TType"
  9206. abstract="false" native="false" synchronized="false"
  9207. static="true" final="false" visibility="public"
  9208. deprecated="not deprecated">
  9209. <param name="name" type="java.lang.String"/>
  9210. </method>
  9211. </class>
  9212. <!-- end class org.apache.hadoop.mapred.join.Parser.TType -->
  9213. <!-- start interface org.apache.hadoop.mapred.join.ResetableIterator -->
  9214. <interface name="ResetableIterator" abstract="true"
  9215. static="false" final="false" visibility="public"
  9216. deprecated="Use
  9217. {@link org.apache.hadoop.mapreduce.lib.join.ResetableIterator} instead">
  9218. <implements name="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  9219. <doc>
  9220. <![CDATA[This defines an interface to a stateful Iterator that can replay elements
  9221. added to it directly.
  9222. Note that this does not extend {@link java.util.Iterator}.
  9223. @deprecated Use
  9224. {@link org.apache.hadoop.mapreduce.lib.join.ResetableIterator} instead]]>
  9225. </doc>
  9226. </interface>
  9227. <!-- end interface org.apache.hadoop.mapred.join.ResetableIterator -->
  9228. <!-- start class org.apache.hadoop.mapred.join.ResetableIterator.EMPTY -->
  9229. <class name="ResetableIterator.EMPTY" extends="org.apache.hadoop.mapreduce.lib.join.ResetableIterator.EMPTY"
  9230. abstract="false"
  9231. static="true" final="false" visibility="public"
  9232. deprecated="not deprecated">
  9233. <implements name="org.apache.hadoop.mapred.join.ResetableIterator"/>
  9234. <constructor name="ResetableIterator.EMPTY"
  9235. static="false" final="false" visibility="public"
  9236. deprecated="not deprecated">
  9237. </constructor>
  9238. </class>
  9239. <!-- end class org.apache.hadoop.mapred.join.ResetableIterator.EMPTY -->
  9240. <!-- start class org.apache.hadoop.mapred.join.StreamBackedIterator -->
  9241. <class name="StreamBackedIterator" extends="org.apache.hadoop.mapreduce.lib.join.StreamBackedIterator"
  9242. abstract="false"
  9243. static="false" final="false" visibility="public"
  9244. deprecated="Use
  9245. {@link org.apache.hadoop.mapreduce.lib.join.StreamBackedIterator} instead">
  9246. <implements name="org.apache.hadoop.mapred.join.ResetableIterator"/>
  9247. <constructor name="StreamBackedIterator"
  9248. static="false" final="false" visibility="public"
  9249. deprecated="not deprecated">
  9250. </constructor>
  9251. <doc>
  9252. <![CDATA[This class provides an implementation of ResetableIterator. This
  9253. implementation uses a byte array to store elements added to it.
  9254. @deprecated Use
  9255. {@link org.apache.hadoop.mapreduce.lib.join.StreamBackedIterator} instead]]>
  9256. </doc>
  9257. </class>
  9258. <!-- end class org.apache.hadoop.mapred.join.StreamBackedIterator -->
  9259. <!-- start class org.apache.hadoop.mapred.join.TupleWritable -->
  9260. <class name="TupleWritable" extends="org.apache.hadoop.mapreduce.lib.join.TupleWritable"
  9261. abstract="false"
  9262. static="false" final="false" visibility="public"
  9263. deprecated="Use
  9264. {@link org.apache.hadoop.mapreduce.lib.join.TupleWritable} instead">
  9265. <constructor name="TupleWritable"
  9266. static="false" final="false" visibility="public"
  9267. deprecated="not deprecated">
  9268. <doc>
  9269. <![CDATA[Create an empty tuple with no allocated storage for writables.]]>
  9270. </doc>
  9271. </constructor>
  9272. <constructor name="TupleWritable" type="org.apache.hadoop.io.Writable[]"
  9273. static="false" final="false" visibility="public"
  9274. deprecated="not deprecated">
  9275. <doc>
  9276. <![CDATA[Initialize tuple with storage; unknown whether any of them contain
  9277. &quot;written&quot; values.]]>
  9278. </doc>
  9279. </constructor>
  9280. <doc>
  9281. <![CDATA[Writable type storing multiple {@link org.apache.hadoop.io.Writable}s.
  9282. This is *not* a general-purpose tuple type. In almost all cases, users are
  9283. encouraged to implement their own serializable types, which can perform
  9284. better validation and provide more efficient encodings than this class is
  9285. capable of. TupleWritable relies on the join framework for type safety and
  9286. assumes its instances will rarely be persisted, assumptions not only
  9287. incompatible with, but contrary to the general case.
  9288. @see org.apache.hadoop.io.Writable
  9289. @deprecated Use
  9290. {@link org.apache.hadoop.mapreduce.lib.join.TupleWritable} instead]]>
  9291. </doc>
  9292. </class>
  9293. <!-- end class org.apache.hadoop.mapred.join.TupleWritable -->
  9294. <!-- start class org.apache.hadoop.mapred.join.WrappedRecordReader -->
  9295. <class name="WrappedRecordReader" extends="java.lang.Object"
  9296. abstract="false"
  9297. static="false" final="false" visibility="public"
  9298. deprecated="Use
  9299. {@link org.apache.hadoop.mapreduce.lib.join.WrappedRecordReader} instead">
  9300. <implements name="org.apache.hadoop.mapred.join.ComposableRecordReader"/>
  9301. <method name="id" return="int"
  9302. abstract="false" native="false" synchronized="false"
  9303. static="false" final="false" visibility="public"
  9304. deprecated="not deprecated">
  9305. <doc>
  9306. <![CDATA[{@inheritDoc}]]>
  9307. </doc>
  9308. </method>
  9309. <method name="key" return="K"
  9310. abstract="false" native="false" synchronized="false"
  9311. static="false" final="false" visibility="public"
  9312. deprecated="not deprecated">
  9313. <doc>
  9314. <![CDATA[Return the key at the head of this RR.]]>
  9315. </doc>
  9316. </method>
  9317. <method name="key"
  9318. abstract="false" native="false" synchronized="false"
  9319. static="false" final="false" visibility="public"
  9320. deprecated="not deprecated">
  9321. <param name="qkey" type="K"/>
  9322. <exception name="IOException" type="java.io.IOException"/>
  9323. <doc>
  9324. <![CDATA[Clone the key at the head of this RR into the object supplied.]]>
  9325. </doc>
  9326. </method>
  9327. <method name="hasNext" return="boolean"
  9328. abstract="false" native="false" synchronized="false"
  9329. static="false" final="false" visibility="public"
  9330. deprecated="not deprecated">
  9331. <doc>
  9332. <![CDATA[Return true if the RR- including the k,v pair stored in this object-
  9333. is exhausted.]]>
  9334. </doc>
  9335. </method>
  9336. <method name="skip"
  9337. abstract="false" native="false" synchronized="false"
  9338. static="false" final="false" visibility="public"
  9339. deprecated="not deprecated">
  9340. <param name="key" type="K"/>
  9341. <exception name="IOException" type="java.io.IOException"/>
  9342. <doc>
  9343. <![CDATA[Skip key-value pairs with keys less than or equal to the key provided.]]>
  9344. </doc>
  9345. </method>
  9346. <method name="next" return="boolean"
  9347. abstract="false" native="false" synchronized="false"
  9348. static="false" final="false" visibility="protected"
  9349. deprecated="not deprecated">
  9350. <exception name="IOException" type="java.io.IOException"/>
  9351. <doc>
  9352. <![CDATA[Read the next k,v pair into the head of this object; return true iff
  9353. the RR and this are exhausted.]]>
  9354. </doc>
  9355. </method>
  9356. <method name="accept"
  9357. abstract="false" native="false" synchronized="false"
  9358. static="false" final="false" visibility="public"
  9359. deprecated="not deprecated">
  9360. <param name="i" type="org.apache.hadoop.mapred.join.CompositeRecordReader.JoinCollector"/>
  9361. <param name="key" type="K"/>
  9362. <exception name="IOException" type="java.io.IOException"/>
  9363. <doc>
  9364. <![CDATA[Add an iterator to the collector at the position occupied by this
  9365. RecordReader over the values in this stream paired with the key
  9366. provided (ie register a stream of values from this source matching K
  9367. with a collector).]]>
  9368. </doc>
  9369. </method>
  9370. <method name="next" return="boolean"
  9371. abstract="false" native="false" synchronized="false"
  9372. static="false" final="false" visibility="public"
  9373. deprecated="not deprecated">
  9374. <param name="key" type="K"/>
  9375. <param name="value" type="U"/>
  9376. <exception name="IOException" type="java.io.IOException"/>
  9377. <doc>
  9378. <![CDATA[Write key-value pair at the head of this stream to the objects provided;
  9379. get next key-value pair from proxied RR.]]>
  9380. </doc>
  9381. </method>
  9382. <method name="createKey" return="K"
  9383. abstract="false" native="false" synchronized="false"
  9384. static="false" final="false" visibility="public"
  9385. deprecated="not deprecated">
  9386. <doc>
  9387. <![CDATA[Request new key from proxied RR.]]>
  9388. </doc>
  9389. </method>
  9390. <method name="createValue" return="U"
  9391. abstract="false" native="false" synchronized="false"
  9392. static="false" final="false" visibility="public"
  9393. deprecated="not deprecated">
  9394. <doc>
  9395. <![CDATA[Request new value from proxied RR.]]>
  9396. </doc>
  9397. </method>
  9398. <method name="getProgress" return="float"
  9399. abstract="false" native="false" synchronized="false"
  9400. static="false" final="false" visibility="public"
  9401. deprecated="not deprecated">
  9402. <exception name="IOException" type="java.io.IOException"/>
  9403. <doc>
  9404. <![CDATA[Request progress from proxied RR.]]>
  9405. </doc>
  9406. </method>
  9407. <method name="getPos" return="long"
  9408. abstract="false" native="false" synchronized="false"
  9409. static="false" final="false" visibility="public"
  9410. deprecated="not deprecated">
  9411. <exception name="IOException" type="java.io.IOException"/>
  9412. <doc>
  9413. <![CDATA[Request position from proxied RR.]]>
  9414. </doc>
  9415. </method>
  9416. <method name="close"
  9417. abstract="false" native="false" synchronized="false"
  9418. static="false" final="false" visibility="public"
  9419. deprecated="not deprecated">
  9420. <exception name="IOException" type="java.io.IOException"/>
  9421. <doc>
  9422. <![CDATA[Forward close request to proxied RR.]]>
  9423. </doc>
  9424. </method>
  9425. <method name="compareTo" return="int"
  9426. abstract="false" native="false" synchronized="false"
  9427. static="false" final="false" visibility="public"
  9428. deprecated="not deprecated">
  9429. <param name="other" type="org.apache.hadoop.mapred.join.ComposableRecordReader"/>
  9430. <doc>
  9431. <![CDATA[Implement Comparable contract (compare key at head of proxied RR
  9432. with that of another).]]>
  9433. </doc>
  9434. </method>
  9435. <method name="equals" return="boolean"
  9436. abstract="false" native="false" synchronized="false"
  9437. static="false" final="false" visibility="public"
  9438. deprecated="not deprecated">
  9439. <param name="other" type="java.lang.Object"/>
  9440. <doc>
  9441. <![CDATA[Return true iff compareTo(other) returns 0.]]>
  9442. </doc>
  9443. </method>
  9444. <method name="hashCode" return="int"
  9445. abstract="false" native="false" synchronized="false"
  9446. static="false" final="false" visibility="public"
  9447. deprecated="not deprecated">
  9448. </method>
  9449. <doc>
  9450. <![CDATA[Proxy class for a RecordReader participating in the join framework.
  9451. This class keeps track of the &quot;head&quot; key-value pair for the
  9452. provided RecordReader and keeps a store of values matching a key when
  9453. this source is participating in a join.
  9454. @deprecated Use
  9455. {@link org.apache.hadoop.mapreduce.lib.join.WrappedRecordReader} instead]]>
  9456. </doc>
  9457. </class>
  9458. <!-- end class org.apache.hadoop.mapred.join.WrappedRecordReader -->
  9459. </package>
  9460. <package name="org.apache.hadoop.mapred.lib">
  9461. <!-- start class org.apache.hadoop.mapred.lib.BinaryPartitioner -->
  9462. <class name="BinaryPartitioner" extends="org.apache.hadoop.mapreduce.lib.partition.BinaryPartitioner"
  9463. abstract="false"
  9464. static="false" final="false" visibility="public"
  9465. deprecated="Use
  9466. {@link org.apache.hadoop.mapreduce.lib.partition.BinaryPartitioner}
  9467. instead.">
  9468. <implements name="org.apache.hadoop.mapred.Partitioner"/>
  9469. <constructor name="BinaryPartitioner"
  9470. static="false" final="false" visibility="public"
  9471. deprecated="not deprecated">
  9472. </constructor>
  9473. <method name="configure"
  9474. abstract="false" native="false" synchronized="false"
  9475. static="false" final="false" visibility="public"
  9476. deprecated="not deprecated">
  9477. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9478. </method>
  9479. <doc>
  9480. <![CDATA[Partition {@link BinaryComparable} keys using a configurable part of
  9481. the bytes array returned by {@link BinaryComparable#getBytes()}.
  9482. @see org.apache.hadoop.mapreduce.lib.partition.BinaryPartitioner
  9483. @deprecated Use
  9484. {@link org.apache.hadoop.mapreduce.lib.partition.BinaryPartitioner}
  9485. instead.]]>
  9486. </doc>
  9487. </class>
  9488. <!-- end class org.apache.hadoop.mapred.lib.BinaryPartitioner -->
  9489. <!-- start class org.apache.hadoop.mapred.lib.ChainMapper -->
  9490. <class name="ChainMapper" extends="java.lang.Object"
  9491. abstract="false"
  9492. static="false" final="false" visibility="public"
  9493. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.chain.ChainMapper} instead">
  9494. <implements name="org.apache.hadoop.mapred.Mapper"/>
  9495. <constructor name="ChainMapper"
  9496. static="false" final="false" visibility="public"
  9497. deprecated="not deprecated">
  9498. <doc>
  9499. <![CDATA[Constructor.]]>
  9500. </doc>
  9501. </constructor>
  9502. <method name="addMapper"
  9503. abstract="false" native="false" synchronized="false"
  9504. static="true" final="false" visibility="public"
  9505. deprecated="not deprecated">
  9506. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9507. <param name="klass" type="java.lang.Class"/>
  9508. <param name="inputKeyClass" type="java.lang.Class"/>
  9509. <param name="inputValueClass" type="java.lang.Class"/>
  9510. <param name="outputKeyClass" type="java.lang.Class"/>
  9511. <param name="outputValueClass" type="java.lang.Class"/>
  9512. <param name="byValue" type="boolean"/>
  9513. <param name="mapperConf" type="org.apache.hadoop.mapred.JobConf"/>
  9514. <doc>
  9515. <![CDATA[Adds a Mapper class to the chain job's JobConf.
  9516. <p/>
  9517. It has to be specified how key and values are passed from one element of
  9518. the chain to the next, by value or by reference. If a Mapper leverages the
  9519. assumed semantics that the key and values are not modified by the collector
  9520. 'by value' must be used. If the Mapper does not expect this semantics, as
  9521. an optimization to avoid serialization and deserialization 'by reference'
  9522. can be used.
  9523. <p/>
  9524. For the added Mapper the configuration given for it,
  9525. <code>mapperConf</code>, has precedence over the job's JobConf. This
  9526. precedence is in effect when the task is running.
  9527. <p/>
  9528. IMPORTANT: There is no need to specify the output key/value classes for the
  9529. ChainMapper, this is done by the addMapper for the last mapper in the chain.
  9530. <p/>
  9531. @param job job's JobConf to add the Mapper class.
  9532. @param klass the Mapper class to add.
  9533. @param inputKeyClass mapper input key class.
  9534. @param inputValueClass mapper input value class.
  9535. @param outputKeyClass mapper output key class.
  9536. @param outputValueClass mapper output value class.
  9537. @param byValue indicates if key/values should be passed by value
  9538. to the next Mapper in the chain, if any.
  9539. @param mapperConf a JobConf with the configuration for the Mapper
  9540. class. It is recommended to use a JobConf without default values using the
  9541. <code>JobConf(boolean loadDefaults)</code> constructor with FALSE.]]>
  9542. </doc>
  9543. </method>
  9544. <method name="configure"
  9545. abstract="false" native="false" synchronized="false"
  9546. static="false" final="false" visibility="public"
  9547. deprecated="not deprecated">
  9548. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9549. <doc>
  9550. <![CDATA[Configures the ChainMapper and all the Mappers in the chain.
  9551. <p/>
  9552. If this method is overridden, <code>super.configure(...)</code> should be
  9553. invoked at the beginning of the overriding method.]]>
  9554. </doc>
  9555. </method>
  9556. <method name="map"
  9557. abstract="false" native="false" synchronized="false"
  9558. static="false" final="false" visibility="public"
  9559. deprecated="not deprecated">
  9560. <param name="key" type="java.lang.Object"/>
  9561. <param name="value" type="java.lang.Object"/>
  9562. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  9563. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  9564. <exception name="IOException" type="java.io.IOException"/>
  9565. <doc>
  9566. <![CDATA[Chains the <code>map(...)</code> methods of the Mappers in the chain.]]>
  9567. </doc>
  9568. </method>
  9569. <method name="close"
  9570. abstract="false" native="false" synchronized="false"
  9571. static="false" final="false" visibility="public"
  9572. deprecated="not deprecated">
  9573. <exception name="IOException" type="java.io.IOException"/>
  9574. <doc>
  9575. <![CDATA[Closes the ChainMapper and all the Mappers in the chain.
  9576. <p/>
  9577. If this method is overridden, <code>super.close()</code> should be
  9578. invoked at the end of the overriding method.]]>
  9579. </doc>
  9580. </method>
  9581. <doc>
  9582. <![CDATA[The ChainMapper class allows the use of multiple Mapper classes within a single
  9583. Map task.
  9584. <p/>
  9585. The Mapper classes are invoked in a chained (or piped) fashion, the output of
  9586. the first becomes the input of the second, and so on until the last Mapper,
  9587. the output of the last Mapper will be written to the task's output.
  9588. <p/>
  9589. The key functionality of this feature is that the Mappers in the chain do not
  9590. need to be aware that they are executed in a chain. This enables having
  9591. reusable specialized Mappers that can be combined to perform composite
  9592. operations within a single task.
  9593. <p/>
  9594. Special care has to be taken when creating chains that the key/values output
  9595. by a Mapper are valid for the following Mapper in the chain. It is assumed
  9596. all Mappers and the Reduce in the chain use matching output and input key and
  9597. value classes as no conversion is done by the chaining code.
  9598. <p/>
  9599. Using the ChainMapper and the ChainReducer classes it is possible to compose
  9600. Map/Reduce jobs that look like <code>[MAP+ / REDUCE MAP*]</code>. An
  9601. immediate benefit of this pattern is a dramatic reduction in disk IO.
  9602. <p/>
  9603. IMPORTANT: There is no need to specify the output key/value classes for the
  9604. ChainMapper, this is done by the addMapper for the last mapper in the chain.
  9605. <p/>
  9606. ChainMapper usage pattern:
  9607. <p/>
  9608. <pre>
  9609. ...
  9610. conf.setJobName("chain");
  9611. conf.setInputFormat(TextInputFormat.class);
  9612. conf.setOutputFormat(TextOutputFormat.class);
  9613. <p/>
  9614. JobConf mapAConf = new JobConf(false);
  9615. ...
  9616. ChainMapper.addMapper(conf, AMap.class, LongWritable.class, Text.class,
  9617. Text.class, Text.class, true, mapAConf);
  9618. <p/>
  9619. JobConf mapBConf = new JobConf(false);
  9620. ...
  9621. ChainMapper.addMapper(conf, BMap.class, Text.class, Text.class,
  9622. LongWritable.class, Text.class, false, mapBConf);
  9623. <p/>
  9624. JobConf reduceConf = new JobConf(false);
  9625. ...
  9626. ChainReducer.setReducer(conf, XReduce.class, LongWritable.class, Text.class,
  9627. Text.class, Text.class, true, reduceConf);
  9628. <p/>
  9629. ChainReducer.addMapper(conf, CMap.class, Text.class, Text.class,
  9630. LongWritable.class, Text.class, false, null);
  9631. <p/>
  9632. ChainReducer.addMapper(conf, DMap.class, LongWritable.class, Text.class,
  9633. LongWritable.class, LongWritable.class, true, null);
  9634. <p/>
  9635. FileInputFormat.setInputPaths(conf, inDir);
  9636. FileOutputFormat.setOutputPath(conf, outDir);
  9637. ...
  9638. <p/>
  9639. JobClient jc = new JobClient(conf);
  9640. RunningJob job = jc.submitJob(conf);
  9641. ...
  9642. </pre>
  9643. @deprecated
  9644. Use {@link org.apache.hadoop.mapreduce.lib.chain.ChainMapper} instead]]>
  9645. </doc>
  9646. </class>
  9647. <!-- end class org.apache.hadoop.mapred.lib.ChainMapper -->
  9648. <!-- start class org.apache.hadoop.mapred.lib.ChainReducer -->
  9649. <class name="ChainReducer" extends="java.lang.Object"
  9650. abstract="false"
  9651. static="false" final="false" visibility="public"
  9652. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.chain.ChainReducer} instead">
  9653. <implements name="org.apache.hadoop.mapred.Reducer"/>
  9654. <constructor name="ChainReducer"
  9655. static="false" final="false" visibility="public"
  9656. deprecated="not deprecated">
  9657. <doc>
  9658. <![CDATA[Constructor.]]>
  9659. </doc>
  9660. </constructor>
  9661. <method name="setReducer"
  9662. abstract="false" native="false" synchronized="false"
  9663. static="true" final="false" visibility="public"
  9664. deprecated="not deprecated">
  9665. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9666. <param name="klass" type="java.lang.Class"/>
  9667. <param name="inputKeyClass" type="java.lang.Class"/>
  9668. <param name="inputValueClass" type="java.lang.Class"/>
  9669. <param name="outputKeyClass" type="java.lang.Class"/>
  9670. <param name="outputValueClass" type="java.lang.Class"/>
  9671. <param name="byValue" type="boolean"/>
  9672. <param name="reducerConf" type="org.apache.hadoop.mapred.JobConf"/>
  9673. <doc>
  9674. <![CDATA[Sets the Reducer class to the chain job's JobConf.
  9675. <p/>
  9676. It has to be specified how key and values are passed from one element of
  9677. the chain to the next, by value or by reference. If a Reducer leverages the
  9678. assumed semantics that the key and values are not modified by the collector
  9679. 'by value' must be used. If the Reducer does not expect this semantics, as
  9680. an optimization to avoid serialization and deserialization 'by reference'
  9681. can be used.
  9682. <p/>
  9683. For the added Reducer the configuration given for it,
  9684. <code>reducerConf</code>, has precedence over the job's JobConf. This
  9685. precedence is in effect when the task is running.
  9686. <p/>
  9687. IMPORTANT: There is no need to specify the output key/value classes for the
  9688. ChainReducer, this is done by the setReducer or the addMapper for the last
  9689. element in the chain.
  9690. @param job job's JobConf to add the Reducer class.
  9691. @param klass the Reducer class to add.
  9692. @param inputKeyClass reducer input key class.
  9693. @param inputValueClass reducer input value class.
  9694. @param outputKeyClass reducer output key class.
  9695. @param outputValueClass reducer output value class.
  9696. @param byValue indicates if key/values should be passed by value
  9697. to the next Mapper in the chain, if any.
  9698. @param reducerConf a JobConf with the configuration for the Reducer
  9699. class. It is recommended to use a JobConf without default values using the
  9700. <code>JobConf(boolean loadDefaults)</code> constructor with FALSE.]]>
  9701. </doc>
  9702. </method>
  9703. <method name="addMapper"
  9704. abstract="false" native="false" synchronized="false"
  9705. static="true" final="false" visibility="public"
  9706. deprecated="not deprecated">
  9707. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9708. <param name="klass" type="java.lang.Class"/>
  9709. <param name="inputKeyClass" type="java.lang.Class"/>
  9710. <param name="inputValueClass" type="java.lang.Class"/>
  9711. <param name="outputKeyClass" type="java.lang.Class"/>
  9712. <param name="outputValueClass" type="java.lang.Class"/>
  9713. <param name="byValue" type="boolean"/>
  9714. <param name="mapperConf" type="org.apache.hadoop.mapred.JobConf"/>
  9715. <doc>
  9716. <![CDATA[Adds a Mapper class to the chain job's JobConf.
  9717. <p/>
  9718. It has to be specified how key and values are passed from one element of
  9719. the chain to the next, by value or by reference. If a Mapper leverages the
  9720. assumed semantics that the key and values are not modified by the collector
  9721. 'by value' must be used. If the Mapper does not expect this semantics, as
  9722. an optimization to avoid serialization and deserialization 'by reference'
  9723. can be used.
  9724. <p/>
  9725. For the added Mapper the configuration given for it,
  9726. <code>mapperConf</code>, has precedence over the job's JobConf. This
  9727. precedence is in effect when the task is running.
  9728. <p/>
  9729. IMPORTANT: There is no need to specify the output key/value classes for the
  9730. ChainMapper, this is done by the addMapper for the last mapper in the
  9731. chain.
  9732. @param job chain job's JobConf to add the Mapper class.
  9733. @param klass the Mapper class to add.
  9734. @param inputKeyClass mapper input key class.
  9735. @param inputValueClass mapper input value class.
  9736. @param outputKeyClass mapper output key class.
  9737. @param outputValueClass mapper output value class.
  9738. @param byValue indicates if key/values should be passed by value
  9739. to the next Mapper in the chain, if any.
  9740. @param mapperConf a JobConf with the configuration for the Mapper
  9741. class. It is recommended to use a JobConf without default values using the
  9742. <code>JobConf(boolean loadDefaults)</code> constructor with FALSE.]]>
  9743. </doc>
  9744. </method>
  9745. <method name="configure"
  9746. abstract="false" native="false" synchronized="false"
  9747. static="false" final="false" visibility="public"
  9748. deprecated="not deprecated">
  9749. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9750. <doc>
  9751. <![CDATA[Configures the ChainReducer, the Reducer and all the Mappers in the chain.
  9752. <p/>
  9753. If this method is overridden, <code>super.configure(...)</code> should be
  9754. invoked at the beginning of the overriding method.]]>
  9755. </doc>
  9756. </method>
  9757. <method name="reduce"
  9758. abstract="false" native="false" synchronized="false"
  9759. static="false" final="false" visibility="public"
  9760. deprecated="not deprecated">
  9761. <param name="key" type="java.lang.Object"/>
  9762. <param name="values" type="java.util.Iterator"/>
  9763. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  9764. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  9765. <exception name="IOException" type="java.io.IOException"/>
  9766. <doc>
  9767. <![CDATA[Chains the <code>reduce(...)</code> method of the Reducer with the
  9768. <code>map(...) </code> methods of the Mappers in the chain.]]>
  9769. </doc>
  9770. </method>
  9771. <method name="close"
  9772. abstract="false" native="false" synchronized="false"
  9773. static="false" final="false" visibility="public"
  9774. deprecated="not deprecated">
  9775. <exception name="IOException" type="java.io.IOException"/>
  9776. <doc>
  9777. <![CDATA[Closes the ChainReducer, the Reducer and all the Mappers in the chain.
  9778. <p/>
  9779. If this method is overridden, <code>super.close()</code> should be
  9780. invoked at the end of the overriding method.]]>
  9781. </doc>
  9782. </method>
  9783. <doc>
  9784. <![CDATA[The ChainReducer class allows chaining multiple Mapper classes after a
  9785. Reducer within the Reducer task.
  9786. <p/>
  9787. For each record output by the Reducer, the Mapper classes are invoked in a
  9788. chained (or piped) fashion, the output of the first becomes the input of the
  9789. second, and so on until the last Mapper, the output of the last Mapper will
  9790. be written to the task's output.
  9791. <p/>
  9792. The key functionality of this feature is that the Mappers in the chain do not
  9793. need to be aware that they are executed after the Reducer or in a chain.
  9794. This enables having reusable specialized Mappers that can be combined to
  9795. perform composite operations within a single task.
  9796. <p/>
  9797. Special care has to be taken when creating chains that the key/values output
  9798. by a Mapper are valid for the following Mapper in the chain. It is assumed
  9799. all Mappers and the Reduce in the chain use matching output and input key and
  9800. value classes as no conversion is done by the chaining code.
  9801. <p/>
  9802. Using the ChainMapper and the ChainReducer classes it is possible to compose
  9803. Map/Reduce jobs that look like <code>[MAP+ / REDUCE MAP*]</code>. An
  9804. immediate benefit of this pattern is a dramatic reduction in disk IO.
  9805. <p/>
  9806. IMPORTANT: There is no need to specify the output key/value classes for the
  9807. ChainReducer, this is done by the setReducer or the addMapper for the last
  9808. element in the chain.
  9809. <p/>
  9810. ChainReducer usage pattern:
  9811. <p/>
  9812. <pre>
  9813. ...
  9814. conf.setJobName("chain");
  9815. conf.setInputFormat(TextInputFormat.class);
  9816. conf.setOutputFormat(TextOutputFormat.class);
  9817. <p/>
  9818. JobConf mapAConf = new JobConf(false);
  9819. ...
  9820. ChainMapper.addMapper(conf, AMap.class, LongWritable.class, Text.class,
  9821. Text.class, Text.class, true, mapAConf);
  9822. <p/>
  9823. JobConf mapBConf = new JobConf(false);
  9824. ...
  9825. ChainMapper.addMapper(conf, BMap.class, Text.class, Text.class,
  9826. LongWritable.class, Text.class, false, mapBConf);
  9827. <p/>
  9828. JobConf reduceConf = new JobConf(false);
  9829. ...
  9830. ChainReducer.setReducer(conf, XReduce.class, LongWritable.class, Text.class,
  9831. Text.class, Text.class, true, reduceConf);
  9832. <p/>
  9833. ChainReducer.addMapper(conf, CMap.class, Text.class, Text.class,
  9834. LongWritable.class, Text.class, false, null);
  9835. <p/>
  9836. ChainReducer.addMapper(conf, DMap.class, LongWritable.class, Text.class,
  9837. LongWritable.class, LongWritable.class, true, null);
  9838. <p/>
  9839. FileInputFormat.setInputPaths(conf, inDir);
  9840. FileOutputFormat.setOutputPath(conf, outDir);
  9841. ...
  9842. <p/>
  9843. JobClient jc = new JobClient(conf);
  9844. RunningJob job = jc.submitJob(conf);
  9845. ...
  9846. </pre>
  9847. @deprecated
  9848. Use {@link org.apache.hadoop.mapreduce.lib.chain.ChainReducer} instead]]>
  9849. </doc>
  9850. </class>
  9851. <!-- end class org.apache.hadoop.mapred.lib.ChainReducer -->
  9852. <!-- start class org.apache.hadoop.mapred.lib.CombineFileInputFormat -->
  9853. <class name="CombineFileInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.CombineFileInputFormat"
  9854. abstract="true"
  9855. static="false" final="false" visibility="public"
  9856. deprecated="Use
  9857. {@link org.apache.hadoop.mapreduce.lib.input.CombineFileInputFormat}">
  9858. <implements name="org.apache.hadoop.mapred.InputFormat"/>
  9859. <constructor name="CombineFileInputFormat"
  9860. static="false" final="false" visibility="public"
  9861. deprecated="not deprecated">
  9862. <doc>
  9863. <![CDATA[default constructor]]>
  9864. </doc>
  9865. </constructor>
  9866. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  9867. abstract="false" native="false" synchronized="false"
  9868. static="false" final="false" visibility="public"
  9869. deprecated="not deprecated">
  9870. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9871. <param name="numSplits" type="int"/>
  9872. <exception name="IOException" type="java.io.IOException"/>
  9873. </method>
  9874. <method name="createPool"
  9875. abstract="false" native="false" synchronized="false"
  9876. static="false" final="false" visibility="protected"
  9877. deprecated="Use {@link #createPool(List)}.">
  9878. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  9879. <param name="filters" type="java.util.List"/>
  9880. <doc>
  9881. <![CDATA[Create a new pool and add the filters to it.
  9882. A split cannot have files from different pools.
  9883. @deprecated Use {@link #createPool(List)}.]]>
  9884. </doc>
  9885. </method>
  9886. <method name="createPool"
  9887. abstract="false" native="false" synchronized="false"
  9888. static="false" final="false" visibility="protected"
  9889. deprecated="Use {@link #createPool(PathFilter...)}.">
  9890. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  9891. <param name="filters" type="org.apache.hadoop.fs.PathFilter[]"/>
  9892. <doc>
  9893. <![CDATA[Create a new pool and add the filters to it.
  9894. A pathname can satisfy any one of the specified filters.
  9895. A split cannot have files from different pools.
  9896. @deprecated Use {@link #createPool(PathFilter...)}.]]>
  9897. </doc>
  9898. </method>
  9899. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  9900. abstract="true" native="false" synchronized="false"
  9901. static="false" final="false" visibility="public"
  9902. deprecated="not deprecated">
  9903. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  9904. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  9905. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  9906. <exception name="IOException" type="java.io.IOException"/>
  9907. <doc>
  9908. <![CDATA[This is not implemented yet.]]>
  9909. </doc>
  9910. </method>
  9911. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  9912. abstract="false" native="false" synchronized="false"
  9913. static="false" final="false" visibility="public"
  9914. deprecated="not deprecated">
  9915. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  9916. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  9917. <exception name="IOException" type="java.io.IOException"/>
  9918. </method>
  9919. <doc>
  9920. <![CDATA[An abstract {@link org.apache.hadoop.mapred.InputFormat} that returns {@link CombineFileSplit}'s
  9921. in {@link org.apache.hadoop.mapred.InputFormat#getSplits(JobConf, int)} method.
  9922. Splits are constructed from the files under the input paths.
  9923. A split cannot have files from different pools.
  9924. Each split returned may contain blocks from different files.
  9925. If a maxSplitSize is specified, then blocks on the same node are
  9926. combined to form a single split. Blocks that are left over are
  9927. then combined with other blocks in the same rack.
  9928. If maxSplitSize is not specified, then blocks from the same rack
  9929. are combined in a single split; no attempt is made to create
  9930. node-local splits.
  9931. If the maxSplitSize is equal to the block size, then this class
  9932. is similar to the default splitting behaviour in Hadoop: each
  9933. block is a locally processed split.
  9934. Subclasses implement {@link org.apache.hadoop.mapred.InputFormat#getRecordReader(InputSplit, JobConf, Reporter)}
  9935. to construct <code>RecordReader</code>'s for <code>CombineFileSplit</code>'s.
  9936. @see CombineFileSplit
  9937. @deprecated Use
  9938. {@link org.apache.hadoop.mapreduce.lib.input.CombineFileInputFormat}]]>
  9939. </doc>
  9940. </class>
  9941. <!-- end class org.apache.hadoop.mapred.lib.CombineFileInputFormat -->
  9942. <!-- start class org.apache.hadoop.mapred.lib.CombineFileRecordReader -->
  9943. <class name="CombineFileRecordReader" extends="java.lang.Object"
  9944. abstract="false"
  9945. static="false" final="false" visibility="public"
  9946. deprecated="Use
  9947. {@link org.apache.hadoop.mapreduce.lib.input.CombineFileRecordReader}">
  9948. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  9949. <constructor name="CombineFileRecordReader" type="org.apache.hadoop.mapred.JobConf, org.apache.hadoop.mapred.lib.CombineFileSplit, org.apache.hadoop.mapred.Reporter, java.lang.Class"
  9950. static="false" final="false" visibility="public"
  9951. deprecated="not deprecated">
  9952. <exception name="IOException" type="java.io.IOException"/>
  9953. <doc>
  9954. <![CDATA[A generic RecordReader that can hand out different recordReaders
  9955. for each chunk in the CombineFileSplit.]]>
  9956. </doc>
  9957. </constructor>
  9958. <method name="next" return="boolean"
  9959. abstract="false" native="false" synchronized="false"
  9960. static="false" final="false" visibility="public"
  9961. deprecated="not deprecated">
  9962. <param name="key" type="K"/>
  9963. <param name="value" type="V"/>
  9964. <exception name="IOException" type="java.io.IOException"/>
  9965. </method>
  9966. <method name="createKey" return="K"
  9967. abstract="false" native="false" synchronized="false"
  9968. static="false" final="false" visibility="public"
  9969. deprecated="not deprecated">
  9970. </method>
  9971. <method name="createValue" return="V"
  9972. abstract="false" native="false" synchronized="false"
  9973. static="false" final="false" visibility="public"
  9974. deprecated="not deprecated">
  9975. </method>
  9976. <method name="getPos" return="long"
  9977. abstract="false" native="false" synchronized="false"
  9978. static="false" final="false" visibility="public"
  9979. deprecated="not deprecated">
  9980. <exception name="IOException" type="java.io.IOException"/>
  9981. <doc>
  9982. <![CDATA[return the amount of data processed]]>
  9983. </doc>
  9984. </method>
  9985. <method name="close"
  9986. abstract="false" native="false" synchronized="false"
  9987. static="false" final="false" visibility="public"
  9988. deprecated="not deprecated">
  9989. <exception name="IOException" type="java.io.IOException"/>
  9990. </method>
  9991. <method name="getProgress" return="float"
  9992. abstract="false" native="false" synchronized="false"
  9993. static="false" final="false" visibility="public"
  9994. deprecated="not deprecated">
  9995. <exception name="IOException" type="java.io.IOException"/>
  9996. <doc>
  9997. <![CDATA[return progress based on the amount of data processed so far.]]>
  9998. </doc>
  9999. </method>
  10000. <method name="initNextRecordReader" return="boolean"
  10001. abstract="false" native="false" synchronized="false"
  10002. static="false" final="false" visibility="protected"
  10003. deprecated="not deprecated">
  10004. <exception name="IOException" type="java.io.IOException"/>
  10005. <doc>
  10006. <![CDATA[Get the record reader for the next chunk in this CombineFileSplit.]]>
  10007. </doc>
  10008. </method>
  10009. <field name="split" type="org.apache.hadoop.mapred.lib.CombineFileSplit"
  10010. transient="false" volatile="false"
  10011. static="false" final="false" visibility="protected"
  10012. deprecated="not deprecated">
  10013. </field>
  10014. <field name="jc" type="org.apache.hadoop.mapred.JobConf"
  10015. transient="false" volatile="false"
  10016. static="false" final="false" visibility="protected"
  10017. deprecated="not deprecated">
  10018. </field>
  10019. <field name="reporter" type="org.apache.hadoop.mapred.Reporter"
  10020. transient="false" volatile="false"
  10021. static="false" final="false" visibility="protected"
  10022. deprecated="not deprecated">
  10023. </field>
  10024. <field name="rrClass" type="java.lang.Class"
  10025. transient="false" volatile="false"
  10026. static="false" final="false" visibility="protected"
  10027. deprecated="not deprecated">
  10028. </field>
  10029. <field name="rrConstructor" type="java.lang.reflect.Constructor"
  10030. transient="false" volatile="false"
  10031. static="false" final="false" visibility="protected"
  10032. deprecated="not deprecated">
  10033. </field>
  10034. <field name="fs" type="org.apache.hadoop.fs.FileSystem"
  10035. transient="false" volatile="false"
  10036. static="false" final="false" visibility="protected"
  10037. deprecated="not deprecated">
  10038. </field>
  10039. <field name="idx" type="int"
  10040. transient="false" volatile="false"
  10041. static="false" final="false" visibility="protected"
  10042. deprecated="not deprecated">
  10043. </field>
  10044. <field name="progress" type="long"
  10045. transient="false" volatile="false"
  10046. static="false" final="false" visibility="protected"
  10047. deprecated="not deprecated">
  10048. </field>
  10049. <field name="curReader" type="org.apache.hadoop.mapred.RecordReader"
  10050. transient="false" volatile="false"
  10051. static="false" final="false" visibility="protected"
  10052. deprecated="not deprecated">
  10053. </field>
  10054. <doc>
  10055. <![CDATA[A generic RecordReader that can hand out different recordReaders
  10056. for each chunk in a {@link CombineFileSplit}.
  10057. A CombineFileSplit can combine data chunks from multiple files.
  10058. This class allows using different RecordReaders for processing
  10059. these data chunks from different files.
  10060. @see CombineFileSplit
  10061. @deprecated Use
  10062. {@link org.apache.hadoop.mapreduce.lib.input.CombineFileRecordReader}]]>
  10063. </doc>
  10064. </class>
  10065. <!-- end class org.apache.hadoop.mapred.lib.CombineFileRecordReader -->
  10066. <!-- start class org.apache.hadoop.mapred.lib.CombineFileSplit -->
  10067. <class name="CombineFileSplit" extends="org.apache.hadoop.mapreduce.lib.input.CombineFileSplit"
  10068. abstract="false"
  10069. static="false" final="false" visibility="public"
  10070. deprecated="Use
  10071. {@link org.apache.hadoop.mapreduce.lib.input.CombineFileSplit}">
  10072. <implements name="org.apache.hadoop.mapred.InputSplit"/>
  10073. <constructor name="CombineFileSplit"
  10074. static="false" final="false" visibility="public"
  10075. deprecated="not deprecated">
  10076. </constructor>
  10077. <constructor name="CombineFileSplit" type="org.apache.hadoop.mapred.JobConf, org.apache.hadoop.fs.Path[], long[], long[], java.lang.String[]"
  10078. static="false" final="false" visibility="public"
  10079. deprecated="not deprecated">
  10080. </constructor>
  10081. <constructor name="CombineFileSplit" type="org.apache.hadoop.mapred.JobConf, org.apache.hadoop.fs.Path[], long[]"
  10082. static="false" final="false" visibility="public"
  10083. deprecated="not deprecated">
  10084. </constructor>
  10085. <constructor name="CombineFileSplit" type="org.apache.hadoop.mapred.lib.CombineFileSplit"
  10086. static="false" final="false" visibility="public"
  10087. deprecated="not deprecated">
  10088. <exception name="IOException" type="java.io.IOException"/>
  10089. <doc>
  10090. <![CDATA[Copy constructor]]>
  10091. </doc>
  10092. </constructor>
  10093. <method name="getJob" return="org.apache.hadoop.mapred.JobConf"
  10094. abstract="false" native="false" synchronized="false"
  10095. static="false" final="false" visibility="public"
  10096. deprecated="not deprecated">
  10097. </method>
  10098. <doc>
  10099. <![CDATA[@deprecated Use
  10100. {@link org.apache.hadoop.mapreduce.lib.input.CombineFileSplit}]]>
  10101. </doc>
  10102. </class>
  10103. <!-- end class org.apache.hadoop.mapred.lib.CombineFileSplit -->
  10104. <!-- start class org.apache.hadoop.mapred.lib.FieldSelectionMapReduce -->
  10105. <class name="FieldSelectionMapReduce" extends="java.lang.Object"
  10106. abstract="false"
  10107. static="false" final="false" visibility="public"
  10108. deprecated="Use {@link FieldSelectionMapper} and
  10109. {@link FieldSelectionReducer} instead">
  10110. <implements name="org.apache.hadoop.mapred.Mapper"/>
  10111. <implements name="org.apache.hadoop.mapred.Reducer"/>
  10112. <constructor name="FieldSelectionMapReduce"
  10113. static="false" final="false" visibility="public"
  10114. deprecated="not deprecated">
  10115. </constructor>
  10116. <method name="map"
  10117. abstract="false" native="false" synchronized="false"
  10118. static="false" final="false" visibility="public"
  10119. deprecated="not deprecated">
  10120. <param name="key" type="K"/>
  10121. <param name="val" type="V"/>
  10122. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  10123. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10124. <exception name="IOException" type="java.io.IOException"/>
  10125. <doc>
  10126. <![CDATA[The identity function. Input key/value pair is written directly to output.]]>
  10127. </doc>
  10128. </method>
  10129. <method name="configure"
  10130. abstract="false" native="false" synchronized="false"
  10131. static="false" final="false" visibility="public"
  10132. deprecated="not deprecated">
  10133. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10134. </method>
  10135. <method name="close"
  10136. abstract="false" native="false" synchronized="false"
  10137. static="false" final="false" visibility="public"
  10138. deprecated="not deprecated">
  10139. <exception name="IOException" type="java.io.IOException"/>
  10140. </method>
  10141. <method name="reduce"
  10142. abstract="false" native="false" synchronized="false"
  10143. static="false" final="false" visibility="public"
  10144. deprecated="not deprecated">
  10145. <param name="key" type="org.apache.hadoop.io.Text"/>
  10146. <param name="values" type="java.util.Iterator"/>
  10147. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  10148. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10149. <exception name="IOException" type="java.io.IOException"/>
  10150. </method>
  10151. <field name="LOG" type="org.apache.commons.logging.Log"
  10152. transient="false" volatile="false"
  10153. static="true" final="true" visibility="public"
  10154. deprecated="not deprecated">
  10155. </field>
  10156. <doc>
  10157. <![CDATA[This class implements a mapper/reducer class that can be used to perform
  10158. field selections in a manner similar to unix cut. The input data is treated
  10159. as fields separated by a user specified separator (the default value is
  10160. "\t"). The user can specify a list of fields that form the map output keys,
  10161. and a list of fields that form the map output values. If the inputformat is
  10162. TextInputFormat, the mapper will ignore the key to the map function, and the
  10163. fields are from the value only. Otherwise, the fields are the union of those
  10164. from the key and those from the value.
  10165. The field separator is under attribute "mapreduce.fieldsel.data.field.separator"
  10166. The map output field list spec is under attribute
  10167. "mapreduce.fieldsel.map.output.key.value.fields.spec".
  10168. The value is expected to be like "keyFieldsSpec:valueFieldsSpec"
  10169. key/valueFieldsSpec are comma (,) separated field spec: fieldSpec,fieldSpec,fieldSpec ...
  10170. Each field spec can be a simple number (e.g. 5) specifying a specific field, or a range
  10171. (like 2-5) to specify a range of fields, or an open range (like 3-) specifying all
  10172. the fields starting from field 3. The open range field spec applies to value fields only.
  10173. They have no effect on the key fields.
  10174. Here is an example: "4,3,0,1:6,5,1-3,7-". It specifies to use fields 4,3,0 and 1 for keys,
  10175. and use fields 6,5,1,2,3,7 and above for values.
  10176. The reduce output field list spec is under attribute
  10177. "mapreduce.fieldsel.reduce.output.key.value.fields.spec".
  10178. The reducer extracts output key/value pairs in a similar manner, except that
  10179. the key is never ignored.
  10180. @deprecated Use {@link FieldSelectionMapper} and
  10181. {@link FieldSelectionReducer} instead]]>
  10182. </doc>
  10183. </class>
  10184. <!-- end class org.apache.hadoop.mapred.lib.FieldSelectionMapReduce -->
  10185. <!-- start class org.apache.hadoop.mapred.lib.FilterOutputFormat -->
  10186. <class name="FilterOutputFormat" extends="java.lang.Object"
  10187. abstract="false"
  10188. static="false" final="false" visibility="public"
  10189. deprecated="Use
  10190. {@link org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat} instead.">
  10191. <implements name="org.apache.hadoop.mapred.OutputFormat"/>
  10192. <constructor name="FilterOutputFormat"
  10193. static="false" final="false" visibility="public"
  10194. deprecated="not deprecated">
  10195. </constructor>
  10196. <constructor name="FilterOutputFormat" type="org.apache.hadoop.mapred.OutputFormat"
  10197. static="false" final="false" visibility="public"
  10198. deprecated="not deprecated">
  10199. <doc>
  10200. <![CDATA[Create a FilterOutputFormat based on the supplied output format.
  10201. @param out the underlying OutputFormat]]>
  10202. </doc>
  10203. </constructor>
  10204. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  10205. abstract="false" native="false" synchronized="false"
  10206. static="false" final="false" visibility="public"
  10207. deprecated="not deprecated">
  10208. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  10209. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10210. <param name="name" type="java.lang.String"/>
  10211. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  10212. <exception name="IOException" type="java.io.IOException"/>
  10213. </method>
  10214. <method name="checkOutputSpecs"
  10215. abstract="false" native="false" synchronized="false"
  10216. static="false" final="false" visibility="public"
  10217. deprecated="not deprecated">
  10218. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  10219. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10220. <exception name="IOException" type="java.io.IOException"/>
  10221. </method>
  10222. <field name="baseOut" type="org.apache.hadoop.mapred.OutputFormat"
  10223. transient="false" volatile="false"
  10224. static="false" final="false" visibility="protected"
  10225. deprecated="not deprecated">
  10226. </field>
  10227. <doc>
  10228. <![CDATA[FilterOutputFormat is a convenience class that wraps OutputFormat.
  10229. @deprecated Use
  10230. {@link org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat} instead.]]>
  10231. </doc>
  10232. </class>
  10233. <!-- end class org.apache.hadoop.mapred.lib.FilterOutputFormat -->
  10234. <!-- start class org.apache.hadoop.mapred.lib.FilterOutputFormat.FilterRecordWriter -->
  10235. <class name="FilterOutputFormat.FilterRecordWriter" extends="java.lang.Object"
  10236. abstract="false"
  10237. static="true" final="false" visibility="public"
  10238. deprecated="not deprecated">
  10239. <implements name="org.apache.hadoop.mapred.RecordWriter"/>
  10240. <constructor name="FilterOutputFormat.FilterRecordWriter"
  10241. static="false" final="false" visibility="public"
  10242. deprecated="not deprecated">
  10243. <exception name="IOException" type="java.io.IOException"/>
  10244. </constructor>
  10245. <constructor name="FilterOutputFormat.FilterRecordWriter" type="org.apache.hadoop.mapred.RecordWriter"
  10246. static="false" final="false" visibility="public"
  10247. deprecated="not deprecated">
  10248. <exception name="IOException" type="java.io.IOException"/>
  10249. </constructor>
  10250. <method name="close"
  10251. abstract="false" native="false" synchronized="false"
  10252. static="false" final="false" visibility="public"
  10253. deprecated="not deprecated">
  10254. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10255. <exception name="IOException" type="java.io.IOException"/>
  10256. </method>
  10257. <method name="write"
  10258. abstract="false" native="false" synchronized="false"
  10259. static="false" final="false" visibility="public"
  10260. deprecated="not deprecated">
  10261. <param name="key" type="K"/>
  10262. <param name="value" type="V"/>
  10263. <exception name="IOException" type="java.io.IOException"/>
  10264. </method>
  10265. <field name="rawWriter" type="org.apache.hadoop.mapred.RecordWriter"
  10266. transient="false" volatile="false"
  10267. static="false" final="false" visibility="protected"
  10268. deprecated="not deprecated">
  10269. </field>
  10270. <doc>
  10271. <![CDATA[<code>FilterRecordWriter</code> is a convenience wrapper
  10272. class that implements {@link RecordWriter}.]]>
  10273. </doc>
  10274. </class>
  10275. <!-- end class org.apache.hadoop.mapred.lib.FilterOutputFormat.FilterRecordWriter -->
  10276. <!-- start class org.apache.hadoop.mapred.lib.HashPartitioner -->
  10277. <class name="HashPartitioner" extends="java.lang.Object"
  10278. abstract="false"
  10279. static="false" final="false" visibility="public"
  10280. deprecated="Use
  10281. {@link org.apache.hadoop.mapreduce.lib.partition.HashPartitioner} instead.">
  10282. <implements name="org.apache.hadoop.mapred.Partitioner"/>
  10283. <constructor name="HashPartitioner"
  10284. static="false" final="false" visibility="public"
  10285. deprecated="not deprecated">
  10286. </constructor>
  10287. <method name="configure"
  10288. abstract="false" native="false" synchronized="false"
  10289. static="false" final="false" visibility="public"
  10290. deprecated="not deprecated">
  10291. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10292. </method>
  10293. <method name="getPartition" return="int"
  10294. abstract="false" native="false" synchronized="false"
  10295. static="false" final="false" visibility="public"
  10296. deprecated="not deprecated">
  10297. <param name="key" type="K2"/>
  10298. <param name="value" type="V2"/>
  10299. <param name="numReduceTasks" type="int"/>
  10300. <doc>
  10301. <![CDATA[Use {@link Object#hashCode()} to partition.]]>
  10302. </doc>
  10303. </method>
  10304. <doc>
  10305. <![CDATA[Partition keys by their {@link Object#hashCode()}.
  10306. @deprecated Use
  10307. {@link org.apache.hadoop.mapreduce.lib.partition.HashPartitioner} instead.]]>
  10308. </doc>
  10309. </class>
  10310. <!-- end class org.apache.hadoop.mapred.lib.HashPartitioner -->
  10311. <!-- start class org.apache.hadoop.mapred.lib.IdentityMapper -->
  10312. <class name="IdentityMapper" extends="org.apache.hadoop.mapred.MapReduceBase"
  10313. abstract="false"
  10314. static="false" final="false" visibility="public"
  10315. deprecated="Use {@link org.apache.hadoop.mapreduce.Mapper} instead.">
  10316. <implements name="org.apache.hadoop.mapred.Mapper"/>
  10317. <constructor name="IdentityMapper"
  10318. static="false" final="false" visibility="public"
  10319. deprecated="not deprecated">
  10320. </constructor>
  10321. <method name="map"
  10322. abstract="false" native="false" synchronized="false"
  10323. static="false" final="false" visibility="public"
  10324. deprecated="not deprecated">
  10325. <param name="key" type="K"/>
  10326. <param name="val" type="V"/>
  10327. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  10328. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10329. <exception name="IOException" type="java.io.IOException"/>
  10330. <doc>
  10331. <![CDATA[The identity function. Input key/value pair is written directly to
  10332. output.]]>
  10333. </doc>
  10334. </method>
  10335. <doc>
  10336. <![CDATA[Implements the identity function, mapping inputs directly to outputs.
  10337. @deprecated Use {@link org.apache.hadoop.mapreduce.Mapper} instead.]]>
  10338. </doc>
  10339. </class>
  10340. <!-- end class org.apache.hadoop.mapred.lib.IdentityMapper -->
  10341. <!-- start class org.apache.hadoop.mapred.lib.IdentityReducer -->
  10342. <class name="IdentityReducer" extends="org.apache.hadoop.mapred.MapReduceBase"
  10343. abstract="false"
  10344. static="false" final="false" visibility="public"
  10345. deprecated="Use {@link org.apache.hadoop.mapreduce.Reducer} instead.">
  10346. <implements name="org.apache.hadoop.mapred.Reducer"/>
  10347. <constructor name="IdentityReducer"
  10348. static="false" final="false" visibility="public"
  10349. deprecated="not deprecated">
  10350. </constructor>
  10351. <method name="reduce"
  10352. abstract="false" native="false" synchronized="false"
  10353. static="false" final="false" visibility="public"
  10354. deprecated="not deprecated">
  10355. <param name="key" type="K"/>
  10356. <param name="values" type="java.util.Iterator"/>
  10357. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  10358. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10359. <exception name="IOException" type="java.io.IOException"/>
  10360. <doc>
  10361. <![CDATA[Writes all keys and values directly to output.]]>
  10362. </doc>
  10363. </method>
  10364. <doc>
  10365. <![CDATA[Performs no reduction, writing all input values directly to the output.
  10366. @deprecated Use {@link org.apache.hadoop.mapreduce.Reducer} instead.]]>
  10367. </doc>
  10368. </class>
  10369. <!-- end class org.apache.hadoop.mapred.lib.IdentityReducer -->
  10370. <!-- start class org.apache.hadoop.mapred.lib.InputSampler -->
  10371. <class name="InputSampler" extends="org.apache.hadoop.mapreduce.lib.partition.InputSampler"
  10372. abstract="false"
  10373. static="false" final="false" visibility="public"
  10374. deprecated="Use
  10375. {@link org.apache.hadoop.mapreduce.lib.partition.InputSampler}">
  10376. <constructor name="InputSampler" type="org.apache.hadoop.mapred.JobConf"
  10377. static="false" final="false" visibility="public"
  10378. deprecated="not deprecated">
  10379. </constructor>
  10380. <method name="writePartitionFile"
  10381. abstract="false" native="false" synchronized="false"
  10382. static="true" final="false" visibility="public"
  10383. deprecated="not deprecated">
  10384. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10385. <param name="sampler" type="org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler"/>
  10386. <exception name="IOException" type="java.io.IOException"/>
  10387. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  10388. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  10389. </method>
  10390. <doc>
  10391. <![CDATA[@deprecated Use
  10392. {@link org.apache.hadoop.mapreduce.lib.partition.InputSampler}]]>
  10393. </doc>
  10394. </class>
  10395. <!-- end class org.apache.hadoop.mapred.lib.InputSampler -->
  10396. <!-- start class org.apache.hadoop.mapred.lib.InverseMapper -->
  10397. <class name="InverseMapper" extends="org.apache.hadoop.mapred.MapReduceBase"
  10398. abstract="false"
  10399. static="false" final="false" visibility="public"
  10400. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.map.InverseMapper}
  10401. instead.">
  10402. <implements name="org.apache.hadoop.mapred.Mapper"/>
  10403. <constructor name="InverseMapper"
  10404. static="false" final="false" visibility="public"
  10405. deprecated="not deprecated">
  10406. </constructor>
  10407. <method name="map"
  10408. abstract="false" native="false" synchronized="false"
  10409. static="false" final="false" visibility="public"
  10410. deprecated="not deprecated">
  10411. <param name="key" type="K"/>
  10412. <param name="value" type="V"/>
  10413. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  10414. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10415. <exception name="IOException" type="java.io.IOException"/>
  10416. <doc>
  10417. <![CDATA[The inverse function. Input keys and values are swapped.]]>
  10418. </doc>
  10419. </method>
  10420. <doc>
  10421. <![CDATA[A {@link Mapper} that swaps keys and values.
  10422. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.map.InverseMapper}
  10423. instead.]]>
  10424. </doc>
  10425. </class>
  10426. <!-- end class org.apache.hadoop.mapred.lib.InverseMapper -->
  10427. <!-- start class org.apache.hadoop.mapred.lib.KeyFieldBasedComparator -->
  10428. <class name="KeyFieldBasedComparator" extends="org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedComparator"
  10429. abstract="false"
  10430. static="false" final="false" visibility="public"
  10431. deprecated="Use
  10432. {@link org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedComparator}
  10433. instead">
  10434. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  10435. <constructor name="KeyFieldBasedComparator"
  10436. static="false" final="false" visibility="public"
  10437. deprecated="not deprecated">
  10438. </constructor>
  10439. <method name="configure"
  10440. abstract="false" native="false" synchronized="false"
  10441. static="false" final="false" visibility="public"
  10442. deprecated="not deprecated">
  10443. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10444. </method>
  10445. <doc>
  10446. <![CDATA[This comparator implementation provides a subset of the features provided
  10447. by the Unix/GNU Sort. In particular, the supported features are:
  10448. -n, (Sort numerically)
  10449. -r, (Reverse the result of comparison)
  10450. -k pos1[,pos2], where pos is of the form f[.c][opts], where f is the number
  10451. of the field to use, and c is the number of the first character from the
  10452. beginning of the field. Fields and character positions are numbered starting
  10453. with 1; a character position of zero in pos2 indicates the field's last
  10454. character. If '.c' is omitted from pos1, it defaults to 1 (the beginning
  10455. of the field); if omitted from pos2, it defaults to 0 (the end of the
  10456. field). opts are ordering options (any of 'nr' as described above).
  10457. We assume that the fields in the key are separated by
  10458. {@link JobContext#MAP_OUTPUT_KEY_FIELD_SEPERATOR}
  10459. @deprecated Use
  10460. {@link org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedComparator}
  10461. instead]]>
  10462. </doc>
  10463. </class>
  10464. <!-- end class org.apache.hadoop.mapred.lib.KeyFieldBasedComparator -->
  10465. <!-- start class org.apache.hadoop.mapred.lib.KeyFieldBasedPartitioner -->
  10466. <class name="KeyFieldBasedPartitioner" extends="org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedPartitioner"
  10467. abstract="false"
  10468. static="false" final="false" visibility="public"
  10469. deprecated="Use
  10470. {@link org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedPartitioner}
  10471. instead">
  10472. <implements name="org.apache.hadoop.mapred.Partitioner"/>
  10473. <constructor name="KeyFieldBasedPartitioner"
  10474. static="false" final="false" visibility="public"
  10475. deprecated="not deprecated">
  10476. </constructor>
  10477. <method name="configure"
  10478. abstract="false" native="false" synchronized="false"
  10479. static="false" final="false" visibility="public"
  10480. deprecated="not deprecated">
  10481. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10482. </method>
  10483. <doc>
  10484. <![CDATA[Defines a way to partition keys based on certain key fields (also see
  10485. {@link KeyFieldBasedComparator}).
  10486. The key specification supported is of the form -k pos1[,pos2], where,
  10487. pos is of the form f[.c][opts], where f is the number
  10488. of the key field to use, and c is the number of the first character from
  10489. the beginning of the field. Fields and character positions are numbered
  10490. starting with 1; a character position of zero in pos2 indicates the
  10491. field's last character. If '.c' is omitted from pos1, it defaults to 1
  10492. (the beginning of the field); if omitted from pos2, it defaults to 0
  10493. (the end of the field).
  10494. @deprecated Use
  10495. {@link org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedPartitioner}
  10496. instead]]>
  10497. </doc>
  10498. </class>
  10499. <!-- end class org.apache.hadoop.mapred.lib.KeyFieldBasedPartitioner -->
  10500. <!-- start class org.apache.hadoop.mapred.lib.LazyOutputFormat -->
  10501. <class name="LazyOutputFormat" extends="org.apache.hadoop.mapred.lib.FilterOutputFormat"
  10502. abstract="false"
  10503. static="false" final="false" visibility="public"
  10504. deprecated="Use
  10505. {@link org.apache.hadoop.mapreduce.lib.output.LazyOutputFormat} instead.">
  10506. <constructor name="LazyOutputFormat"
  10507. static="false" final="false" visibility="public"
  10508. deprecated="not deprecated">
  10509. </constructor>
  10510. <method name="setOutputFormatClass"
  10511. abstract="false" native="false" synchronized="false"
  10512. static="true" final="false" visibility="public"
  10513. deprecated="not deprecated">
  10514. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10515. <param name="theClass" type="java.lang.Class"/>
  10516. <doc>
  10517. <![CDATA[Set the underlying output format for LazyOutputFormat.
  10518. @param job the {@link JobConf} to modify
  10519. @param theClass the underlying class]]>
  10520. </doc>
  10521. </method>
  10522. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  10523. abstract="false" native="false" synchronized="false"
  10524. static="false" final="false" visibility="public"
  10525. deprecated="not deprecated">
  10526. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  10527. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10528. <param name="name" type="java.lang.String"/>
  10529. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  10530. <exception name="IOException" type="java.io.IOException"/>
  10531. </method>
  10532. <method name="checkOutputSpecs"
  10533. abstract="false" native="false" synchronized="false"
  10534. static="false" final="false" visibility="public"
  10535. deprecated="not deprecated">
  10536. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  10537. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10538. <exception name="IOException" type="java.io.IOException"/>
  10539. </method>
  10540. <doc>
  10541. <![CDATA[A convenience class that creates output lazily.
  10542. @deprecated Use
  10543. {@link org.apache.hadoop.mapreduce.lib.output.LazyOutputFormat} instead.]]>
  10544. </doc>
  10545. </class>
  10546. <!-- end class org.apache.hadoop.mapred.lib.LazyOutputFormat -->
  10547. <!-- start class org.apache.hadoop.mapred.lib.LongSumReducer -->
  10548. <class name="LongSumReducer" extends="org.apache.hadoop.mapred.MapReduceBase"
  10549. abstract="false"
  10550. static="false" final="false" visibility="public"
  10551. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.reduce.LongSumReducer}
  10552. instead.">
  10553. <implements name="org.apache.hadoop.mapred.Reducer"/>
  10554. <constructor name="LongSumReducer"
  10555. static="false" final="false" visibility="public"
  10556. deprecated="not deprecated">
  10557. </constructor>
  10558. <method name="reduce"
  10559. abstract="false" native="false" synchronized="false"
  10560. static="false" final="false" visibility="public"
  10561. deprecated="not deprecated">
  10562. <param name="key" type="K"/>
  10563. <param name="values" type="java.util.Iterator"/>
  10564. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  10565. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10566. <exception name="IOException" type="java.io.IOException"/>
  10567. </method>
  10568. <doc>
  10569. <![CDATA[A {@link Reducer} that sums long values.
  10570. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.reduce.LongSumReducer}
  10571. instead.]]>
  10572. </doc>
  10573. </class>
  10574. <!-- end class org.apache.hadoop.mapred.lib.LongSumReducer -->
  10575. <!-- start class org.apache.hadoop.mapred.lib.MultipleInputs -->
  10576. <class name="MultipleInputs" extends="java.lang.Object"
  10577. abstract="false"
  10578. static="false" final="false" visibility="public"
  10579. deprecated="Use
  10580. {@link org.apache.hadoop.mapreduce.lib.input.MultipleInputs} instead">
  10581. <constructor name="MultipleInputs"
  10582. static="false" final="false" visibility="public"
  10583. deprecated="not deprecated">
  10584. </constructor>
  10585. <method name="addInputPath"
  10586. abstract="false" native="false" synchronized="false"
  10587. static="true" final="false" visibility="public"
  10588. deprecated="not deprecated">
  10589. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10590. <param name="path" type="org.apache.hadoop.fs.Path"/>
  10591. <param name="inputFormatClass" type="java.lang.Class"/>
  10592. <doc>
  10593. <![CDATA[Add a {@link Path} with a custom {@link InputFormat} to the list of
  10594. inputs for the map-reduce job.
  10595. @param conf The configuration of the job
  10596. @param path {@link Path} to be added to the list of inputs for the job
  10597. @param inputFormatClass {@link InputFormat} class to use for this path]]>
  10598. </doc>
  10599. </method>
  10600. <method name="addInputPath"
  10601. abstract="false" native="false" synchronized="false"
  10602. static="true" final="false" visibility="public"
  10603. deprecated="not deprecated">
  10604. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10605. <param name="path" type="org.apache.hadoop.fs.Path"/>
  10606. <param name="inputFormatClass" type="java.lang.Class"/>
  10607. <param name="mapperClass" type="java.lang.Class"/>
  10608. <doc>
  10609. <![CDATA[Add a {@link Path} with a custom {@link InputFormat} and
  10610. {@link Mapper} to the list of inputs for the map-reduce job.
  10611. @param conf The configuration of the job
  10612. @param path {@link Path} to be added to the list of inputs for the job
  10613. @param inputFormatClass {@link InputFormat} class to use for this path
  10614. @param mapperClass {@link Mapper} class to use for this path]]>
  10615. </doc>
  10616. </method>
  10617. <doc>
  10618. <![CDATA[This class supports MapReduce jobs that have multiple input paths with
  10619. a different {@link InputFormat} and {@link Mapper} for each path
  10620. @deprecated Use
  10621. {@link org.apache.hadoop.mapreduce.lib.input.MultipleInputs} instead]]>
  10622. </doc>
  10623. </class>
  10624. <!-- end class org.apache.hadoop.mapred.lib.MultipleInputs -->
  10625. <!-- start class org.apache.hadoop.mapred.lib.MultipleOutputFormat -->
  10626. <class name="MultipleOutputFormat" extends="org.apache.hadoop.mapred.FileOutputFormat"
  10627. abstract="true"
  10628. static="false" final="false" visibility="public"
  10629. deprecated="Use
  10630. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead">
  10631. <constructor name="MultipleOutputFormat"
  10632. static="false" final="false" visibility="public"
  10633. deprecated="not deprecated">
  10634. </constructor>
  10635. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  10636. abstract="false" native="false" synchronized="false"
  10637. static="false" final="false" visibility="public"
  10638. deprecated="not deprecated">
  10639. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  10640. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10641. <param name="name" type="java.lang.String"/>
  10642. <param name="arg3" type="org.apache.hadoop.util.Progressable"/>
  10643. <exception name="IOException" type="java.io.IOException"/>
  10644. <doc>
  10645. <![CDATA[Create a composite record writer that can write key/value data to different
  10646. output files
  10647. @param fs
  10648. the file system to use
  10649. @param job
  10650. the job conf for the job
  10651. @param name
  10652. the leaf file name for the output file (such as "part-00000")
  10653. @param arg3
  10654. a progressable for reporting progress.
  10655. @return a composite record writer
  10656. @throws IOException]]>
  10657. </doc>
  10658. </method>
  10659. <method name="generateLeafFileName" return="java.lang.String"
  10660. abstract="false" native="false" synchronized="false"
  10661. static="false" final="false" visibility="protected"
  10662. deprecated="not deprecated">
  10663. <param name="name" type="java.lang.String"/>
  10664. <doc>
  10665. <![CDATA[Generate the leaf name for the output file name. The default behavior does
  10666. not change the leaf file name (such as part-00000)
  10667. @param name
  10668. the leaf file name for the output file
  10669. @return the given leaf file name]]>
  10670. </doc>
  10671. </method>
  10672. <method name="generateFileNameForKeyValue" return="java.lang.String"
  10673. abstract="false" native="false" synchronized="false"
  10674. static="false" final="false" visibility="protected"
  10675. deprecated="not deprecated">
  10676. <param name="key" type="K"/>
  10677. <param name="value" type="V"/>
  10678. <param name="name" type="java.lang.String"/>
  10679. <doc>
  10680. <![CDATA[Generate the output file name based on the given key and the leaf file
  10681. name. The default behavior is that the file name does not depend on the
  10682. key.
  10683. @param key
  10684. the key of the output data
  10685. @param name
  10686. the leaf file name
  10687. @return generated file name]]>
  10688. </doc>
  10689. </method>
  10690. <method name="generateActualKey" return="K"
  10691. abstract="false" native="false" synchronized="false"
  10692. static="false" final="false" visibility="protected"
  10693. deprecated="not deprecated">
  10694. <param name="key" type="K"/>
  10695. <param name="value" type="V"/>
  10696. <doc>
  10697. <![CDATA[Generate the actual key from the given key/value. The default behavior is that
  10698. the actual key is equal to the given key
  10699. @param key
  10700. the key of the output data
  10701. @param value
  10702. the value of the output data
  10703. @return the actual key derived from the given key/value]]>
  10704. </doc>
  10705. </method>
  10706. <method name="generateActualValue" return="V"
  10707. abstract="false" native="false" synchronized="false"
  10708. static="false" final="false" visibility="protected"
  10709. deprecated="not deprecated">
  10710. <param name="key" type="K"/>
  10711. <param name="value" type="V"/>
  10712. <doc>
  10713. <![CDATA[Generate the actual value from the given key and value. The default behavior is that
  10714. the actual value is equal to the given value
  10715. @param key
  10716. the key of the output data
  10717. @param value
  10718. the value of the output data
  10719. @return the actual value derived from the given key/value]]>
  10720. </doc>
  10721. </method>
  10722. <method name="getInputFileBasedOutputFileName" return="java.lang.String"
  10723. abstract="false" native="false" synchronized="false"
  10724. static="false" final="false" visibility="protected"
  10725. deprecated="not deprecated">
  10726. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10727. <param name="name" type="java.lang.String"/>
  10728. <doc>
  10729. <![CDATA[Generate the outfile name based on a given name and the input file name. If
  10730. the {@link JobContext#MAP_INPUT_FILE} does not exist (i.e. this is not for a map only job),
  10731. the given name is returned unchanged. If the config value for
  10732. "num.of.trailing.legs.to.use" is not set, or set 0 or negative, the given
  10733. name is returned unchanged. Otherwise, return a file name consisting of the
  10734. N trailing legs of the input file name where N is the config value for
  10735. "num.of.trailing.legs.to.use".
  10736. @param job
  10737. the job config
  10738. @param name
  10739. the output file name
  10740. @return the outfile name based on a given name and the input file name.]]>
  10741. </doc>
  10742. </method>
  10743. <method name="getBaseRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  10744. abstract="true" native="false" synchronized="false"
  10745. static="false" final="false" visibility="protected"
  10746. deprecated="not deprecated">
  10747. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  10748. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  10749. <param name="name" type="java.lang.String"/>
  10750. <param name="arg3" type="org.apache.hadoop.util.Progressable"/>
  10751. <exception name="IOException" type="java.io.IOException"/>
  10752. <doc>
  10753. <![CDATA[@param fs
  10754. the file system to use
  10755. @param job
  10756. a job conf object
  10757. @param name
  10758. the name of the file over which a record writer object will be
  10759. constructed
  10760. @param arg3
  10761. a progressable object
  10762. @return A RecordWriter object over the given file
  10763. @throws IOException]]>
  10764. </doc>
  10765. </method>
  10766. <doc>
  10767. <![CDATA[This abstract class extends the FileOutputFormat, allowing to write the
  10768. output data to different output files. There are three basic use cases for
  10769. this class.
  10770. Case one: This class is used for a map reduce job with at least one reducer.
  10771. The reducer wants to write data to different files depending on the actual
  10772. keys. It is assumed that a key (or value) encodes the actual key (value)
  10773. and the desired location for the actual key (value).
  10774. Case two: This class is used for a map only job. The job wants to use an
  10775. output file name that is either a part of the input file name of the input
  10776. data, or some derivation of it.
  10777. Case three: This class is used for a map only job. The job wants to use an
  10778. output file name that depends on both the keys and the input file name.
  10779. @deprecated Use
  10780. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead]]>
  10781. </doc>
  10782. </class>
  10783. <!-- end class org.apache.hadoop.mapred.lib.MultipleOutputFormat -->
  10784. <!-- start class org.apache.hadoop.mapred.lib.MultipleOutputs -->
  10785. <class name="MultipleOutputs" extends="java.lang.Object"
  10786. abstract="false"
  10787. static="false" final="false" visibility="public"
  10788. deprecated="Use
  10789. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead">
  10790. <constructor name="MultipleOutputs" type="org.apache.hadoop.mapred.JobConf"
  10791. static="false" final="false" visibility="public"
  10792. deprecated="not deprecated">
  10793. <doc>
  10794. <![CDATA[Creates and initializes multiple named outputs support, it should be
  10795. instantiated in the Mapper/Reducer configure method.
  10796. @param job the job configuration object]]>
  10797. </doc>
  10798. </constructor>
  10799. <method name="getNamedOutputsList" return="java.util.List"
  10800. abstract="false" native="false" synchronized="false"
  10801. static="true" final="false" visibility="public"
  10802. deprecated="not deprecated">
  10803. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10804. <doc>
  10805. <![CDATA[Returns list of channel names.
  10806. @param conf job conf
  10807. @return List of channel Names]]>
  10808. </doc>
  10809. </method>
  10810. <method name="isMultiNamedOutput" return="boolean"
  10811. abstract="false" native="false" synchronized="false"
  10812. static="true" final="false" visibility="public"
  10813. deprecated="not deprecated">
  10814. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10815. <param name="namedOutput" type="java.lang.String"/>
  10816. <doc>
  10817. <![CDATA[Returns if a named output is multiple.
  10818. @param conf job conf
  10819. @param namedOutput named output
  10820. @return <code>true</code> if the named output is multi, <code>false</code>
  10821. if it is single. If the named output is not defined it returns
  10822. <code>false</code>]]>
  10823. </doc>
  10824. </method>
  10825. <method name="getNamedOutputFormatClass" return="java.lang.Class"
  10826. abstract="false" native="false" synchronized="false"
  10827. static="true" final="false" visibility="public"
  10828. deprecated="not deprecated">
  10829. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10830. <param name="namedOutput" type="java.lang.String"/>
  10831. <doc>
  10832. <![CDATA[Returns the named output OutputFormat.
  10833. @param conf job conf
  10834. @param namedOutput named output
  10835. @return namedOutput OutputFormat]]>
  10836. </doc>
  10837. </method>
  10838. <method name="getNamedOutputKeyClass" return="java.lang.Class"
  10839. abstract="false" native="false" synchronized="false"
  10840. static="true" final="false" visibility="public"
  10841. deprecated="not deprecated">
  10842. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10843. <param name="namedOutput" type="java.lang.String"/>
  10844. <doc>
  10845. <![CDATA[Returns the key class for a named output.
  10846. @param conf job conf
  10847. @param namedOutput named output
  10848. @return class for the named output key]]>
  10849. </doc>
  10850. </method>
  10851. <method name="getNamedOutputValueClass" return="java.lang.Class"
  10852. abstract="false" native="false" synchronized="false"
  10853. static="true" final="false" visibility="public"
  10854. deprecated="not deprecated">
  10855. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10856. <param name="namedOutput" type="java.lang.String"/>
  10857. <doc>
  10858. <![CDATA[Returns the value class for a named output.
  10859. @param conf job conf
  10860. @param namedOutput named output
  10861. @return class of named output value]]>
  10862. </doc>
  10863. </method>
  10864. <method name="addNamedOutput"
  10865. abstract="false" native="false" synchronized="false"
  10866. static="true" final="false" visibility="public"
  10867. deprecated="not deprecated">
  10868. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10869. <param name="namedOutput" type="java.lang.String"/>
  10870. <param name="outputFormatClass" type="java.lang.Class"/>
  10871. <param name="keyClass" type="java.lang.Class"/>
  10872. <param name="valueClass" type="java.lang.Class"/>
  10873. <doc>
  10874. <![CDATA[Adds a named output for the job.
  10875. <p/>
  10876. @param conf job conf to add the named output
  10877. @param namedOutput named output name, it has to be a word, letters
  10878. and numbers only, cannot be the word 'part' as
  10879. that is reserved for the
  10880. default output.
  10881. @param outputFormatClass OutputFormat class.
  10882. @param keyClass key class
  10883. @param valueClass value class]]>
  10884. </doc>
  10885. </method>
  10886. <method name="addMultiNamedOutput"
  10887. abstract="false" native="false" synchronized="false"
  10888. static="true" final="false" visibility="public"
  10889. deprecated="not deprecated">
  10890. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10891. <param name="namedOutput" type="java.lang.String"/>
  10892. <param name="outputFormatClass" type="java.lang.Class"/>
  10893. <param name="keyClass" type="java.lang.Class"/>
  10894. <param name="valueClass" type="java.lang.Class"/>
  10895. <doc>
  10896. <![CDATA[Adds a multi named output for the job.
  10897. <p/>
  10898. @param conf job conf to add the named output
  10899. @param namedOutput named output name, it has to be a word, letters
  10900. and numbers only, cannot be the word 'part' as
  10901. that is reserved for the
  10902. default output.
  10903. @param outputFormatClass OutputFormat class.
  10904. @param keyClass key class
  10905. @param valueClass value class]]>
  10906. </doc>
  10907. </method>
  10908. <method name="setCountersEnabled"
  10909. abstract="false" native="false" synchronized="false"
  10910. static="true" final="false" visibility="public"
  10911. deprecated="not deprecated">
  10912. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10913. <param name="enabled" type="boolean"/>
  10914. <doc>
  10915. <![CDATA[Enables or disables counters for the named outputs.
  10916. <p/>
  10917. By default these counters are disabled.
  10918. <p/>
  10919. MultipleOutputs supports counters; by default they are disabled.
  10920. The counters group is the {@link MultipleOutputs} class name.
  10921. <p/>
  10922. The names of the counters are the same as the named outputs. For multi
  10923. named outputs the name of the counter is the concatenation of the named
  10924. output, and underscore '_' and the multiname.
  10925. @param conf job conf in which to enable or disable the counters.
  10926. @param enabled indicates if the counters will be enabled or not.]]>
  10927. </doc>
  10928. </method>
  10929. <method name="getCountersEnabled" return="boolean"
  10930. abstract="false" native="false" synchronized="false"
  10931. static="true" final="false" visibility="public"
  10932. deprecated="not deprecated">
  10933. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  10934. <doc>
  10935. <![CDATA[Returns if the counters for the named outputs are enabled or not.
  10936. <p/>
  10937. By default these counters are disabled.
  10938. <p/>
  10939. MultipleOutputs supports counters; by default they are disabled.
  10940. The counters group is the {@link MultipleOutputs} class name.
  10941. <p/>
  10942. The names of the counters are the same as the named outputs. For multi
  10943. named outputs the name of the counter is the concatenation of the named
  10944. output, and underscore '_' and the multiname.
  10945. @param conf job conf to read the counters setting from.
  10946. @return TRUE if the counters are enabled, FALSE if they are disabled.]]>
  10947. </doc>
  10948. </method>
  10949. <method name="getNamedOutputs" return="java.util.Iterator"
  10950. abstract="false" native="false" synchronized="false"
  10951. static="false" final="false" visibility="public"
  10952. deprecated="not deprecated">
  10953. <doc>
  10954. <![CDATA[Returns iterator with the defined named outputs.
  10955. @return iterator with the defined named outputs]]>
  10956. </doc>
  10957. </method>
  10958. <method name="getCollector" return="org.apache.hadoop.mapred.OutputCollector"
  10959. abstract="false" native="false" synchronized="false"
  10960. static="false" final="false" visibility="public"
  10961. deprecated="not deprecated">
  10962. <param name="namedOutput" type="java.lang.String"/>
  10963. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10964. <exception name="IOException" type="java.io.IOException"/>
  10965. <doc>
  10966. <![CDATA[Gets the output collector for a named output.
  10967. <p/>
  10968. @param namedOutput the named output name
  10969. @param reporter the reporter
  10970. @return the output collector for the given named output
  10971. @throws IOException thrown if output collector could not be created]]>
  10972. </doc>
  10973. </method>
  10974. <method name="getCollector" return="org.apache.hadoop.mapred.OutputCollector"
  10975. abstract="false" native="false" synchronized="false"
  10976. static="false" final="false" visibility="public"
  10977. deprecated="not deprecated">
  10978. <param name="namedOutput" type="java.lang.String"/>
  10979. <param name="multiName" type="java.lang.String"/>
  10980. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  10981. <exception name="IOException" type="java.io.IOException"/>
  10982. <doc>
  10983. <![CDATA[Gets the output collector for a multi named output.
  10984. <p/>
  10985. @param namedOutput the named output name
  10986. @param multiName the multi name part
  10987. @param reporter the reporter
  10988. @return the output collector for the given named output
  10989. @throws IOException thrown if output collector could not be created]]>
  10990. </doc>
  10991. </method>
  10992. <method name="close"
  10993. abstract="false" native="false" synchronized="false"
  10994. static="false" final="false" visibility="public"
  10995. deprecated="not deprecated">
  10996. <exception name="IOException" type="java.io.IOException"/>
  10997. <doc>
  10998. <![CDATA[Closes all the opened named outputs.
  10999. <p/>
  11000. If overridden, subclasses must invoke <code>super.close()</code> at the
  11001. end of their <code>close()</code>.
  11002. @throws java.io.IOException thrown if any of the MultipleOutput files
  11003. could not be closed properly.]]>
  11004. </doc>
  11005. </method>
  11006. <doc>
  11007. <![CDATA[The MultipleOutputs class simplifies writing to additional outputs other
  11008. than the job default output via the <code>OutputCollector</code> passed to
  11009. the <code>map()</code> and <code>reduce()</code> methods of the
  11010. <code>Mapper</code> and <code>Reducer</code> implementations.
  11011. <p/>
  11012. Each additional output, or named output, may be configured with its own
  11013. <code>OutputFormat</code>, with its own key class and with its own value
  11014. class.
  11015. <p/>
  11016. A named output can be a single file or a multi file. The latter is referred to as
  11017. a multi named output.
  11018. <p/>
  11019. A multi named output is an unbound set of files all sharing the same
  11020. <code>OutputFormat</code>, key class and value class configuration.
  11021. <p/>
  11022. When named outputs are used within a <code>Mapper</code> implementation,
  11023. key/values written to a named output are not part of the reduce phase, only
  11024. key/values written to the job <code>OutputCollector</code> are part of the
  11025. reduce phase.
  11026. <p/>
  11027. MultipleOutputs supports counters; by default they are disabled. The counters
  11028. group is the {@link MultipleOutputs} class name.
  11029. <p/>
  11030. The names of the counters are the same as the named outputs. For multi
  11031. named outputs the name of the counter is the concatenation of the named
  11032. output, and underscore '_' and the multiname.
  11033. <p/>
  11034. Job configuration usage pattern is:
  11035. <pre>
  11036. JobConf conf = new JobConf();
  11037. conf.setInputPath(inDir);
  11038. FileOutputFormat.setOutputPath(conf, outDir);
  11039. conf.setMapperClass(MOMap.class);
  11040. conf.setReducerClass(MOReduce.class);
  11041. ...
  11042. // Defines additional single text based output 'text' for the job
  11043. MultipleOutputs.addNamedOutput(conf, "text", TextOutputFormat.class,
  11044. LongWritable.class, Text.class);
  11045. // Defines additional multi sequencefile based output 'sequence' for the
  11046. // job
  11047. MultipleOutputs.addMultiNamedOutput(conf, "seq",
  11048. SequenceFileOutputFormat.class,
  11049. LongWritable.class, Text.class);
  11050. ...
  11051. JobClient jc = new JobClient();
  11052. RunningJob job = jc.submitJob(conf);
  11053. ...
  11054. </pre>
  11055. <p/>
  11056. Usage pattern in a Reducer is:
  11057. <pre>
  11058. public class MOReduce implements
  11059. Reducer&lt;WritableComparable, Writable&gt; {
  11060. private MultipleOutputs mos;
  11061. public void configure(JobConf conf) {
  11062. ...
  11063. mos = new MultipleOutputs(conf);
  11064. }
  11065. public void reduce(WritableComparable key, Iterator&lt;Writable&gt; values,
  11066. OutputCollector output, Reporter reporter)
  11067. throws IOException {
  11068. ...
  11069. mos.getCollector("text", reporter).collect(key, new Text("Hello"));
  11070. mos.getCollector("seq", "A", reporter).collect(key, new Text("Bye"));
  11071. mos.getCollector("seq", "B", reporter).collect(key, new Text("Chau"));
  11072. ...
  11073. }
  11074. public void close() throws IOException {
  11075. mos.close();
  11076. ...
  11077. }
  11078. }
  11079. </pre>
  11080. @deprecated Use
  11081. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead]]>
  11082. </doc>
  11083. </class>
  11084. <!-- end class org.apache.hadoop.mapred.lib.MultipleOutputs -->
  11085. <!-- start class org.apache.hadoop.mapred.lib.MultipleSequenceFileOutputFormat -->
  11086. <class name="MultipleSequenceFileOutputFormat" extends="org.apache.hadoop.mapred.lib.MultipleOutputFormat"
  11087. abstract="false"
  11088. static="false" final="false" visibility="public"
  11089. deprecated="Use
  11090. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead">
  11091. <constructor name="MultipleSequenceFileOutputFormat"
  11092. static="false" final="false" visibility="public"
  11093. deprecated="not deprecated">
  11094. </constructor>
  11095. <method name="getBaseRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  11096. abstract="false" native="false" synchronized="false"
  11097. static="false" final="false" visibility="protected"
  11098. deprecated="not deprecated">
  11099. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  11100. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11101. <param name="name" type="java.lang.String"/>
  11102. <param name="arg3" type="org.apache.hadoop.util.Progressable"/>
  11103. <exception name="IOException" type="java.io.IOException"/>
  11104. </method>
  11105. <doc>
  11106. <![CDATA[This class extends the MultipleOutputFormat, allowing to write the output data
  11107. to different output files in sequence file output format.
  11108. @deprecated Use
  11109. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead]]>
  11110. </doc>
  11111. </class>
  11112. <!-- end class org.apache.hadoop.mapred.lib.MultipleSequenceFileOutputFormat -->
  11113. <!-- start class org.apache.hadoop.mapred.lib.MultipleTextOutputFormat -->
  11114. <class name="MultipleTextOutputFormat" extends="org.apache.hadoop.mapred.lib.MultipleOutputFormat"
  11115. abstract="false"
  11116. static="false" final="false" visibility="public"
  11117. deprecated="Use
  11118. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead">
  11119. <constructor name="MultipleTextOutputFormat"
  11120. static="false" final="false" visibility="public"
  11121. deprecated="not deprecated">
  11122. </constructor>
  11123. <method name="getBaseRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  11124. abstract="false" native="false" synchronized="false"
  11125. static="false" final="false" visibility="protected"
  11126. deprecated="not deprecated">
  11127. <param name="fs" type="org.apache.hadoop.fs.FileSystem"/>
  11128. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11129. <param name="name" type="java.lang.String"/>
  11130. <param name="arg3" type="org.apache.hadoop.util.Progressable"/>
  11131. <exception name="IOException" type="java.io.IOException"/>
  11132. </method>
  11133. <doc>
  11134. <![CDATA[This class extends the MultipleOutputFormat, allowing to write the output
  11135. data to different output files in Text output format.
  11136. @deprecated Use
  11137. {@link org.apache.hadoop.mapreduce.lib.output.MultipleOutputs} instead]]>
  11138. </doc>
  11139. </class>
  11140. <!-- end class org.apache.hadoop.mapred.lib.MultipleTextOutputFormat -->
  11141. <!-- start class org.apache.hadoop.mapred.lib.MultithreadedMapRunner -->
  11142. <class name="MultithreadedMapRunner" extends="java.lang.Object"
  11143. abstract="false"
  11144. static="false" final="false" visibility="public"
  11145. deprecated="Use {@link MultithreadedMapper} instead.">
  11146. <implements name="org.apache.hadoop.mapred.MapRunnable"/>
  11147. <constructor name="MultithreadedMapRunner"
  11148. static="false" final="false" visibility="public"
  11149. deprecated="not deprecated">
  11150. </constructor>
  11151. <method name="configure"
  11152. abstract="false" native="false" synchronized="false"
  11153. static="false" final="false" visibility="public"
  11154. deprecated="not deprecated">
  11155. <param name="jobConf" type="org.apache.hadoop.mapred.JobConf"/>
  11156. </method>
  11157. <method name="run"
  11158. abstract="false" native="false" synchronized="false"
  11159. static="false" final="false" visibility="public"
  11160. deprecated="not deprecated">
  11161. <param name="input" type="org.apache.hadoop.mapred.RecordReader"/>
  11162. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  11163. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11164. <exception name="IOException" type="java.io.IOException"/>
  11165. </method>
  11166. <doc>
  11167. <![CDATA[Multithreaded implementation for {@link org.apache.hadoop.mapred.MapRunnable}.
  11168. <p>
  11169. It can be used instead of the default implementation,
  11170. {@link org.apache.hadoop.mapred.MapRunner}, when the Map operation is not CPU
  11171. bound in order to improve throughput.
  11172. <p>
  11173. Map implementations using this MapRunnable must be thread-safe.
  11174. <p>
  11175. The Map-Reduce job has to be configured to use this MapRunnable class (using
  11176. the JobConf.setMapRunnerClass method) and
  11177. the number of threads the thread-pool can use with the
  11178. <code>mapred.map.multithreadedrunner.threads</code> property, its default
  11179. value is 10 threads.
  11180. <p>
  11181. @deprecated Use {@link MultithreadedMapper} instead.]]>
  11182. </doc>
  11183. </class>
  11184. <!-- end class org.apache.hadoop.mapred.lib.MultithreadedMapRunner -->
  11185. <!-- start class org.apache.hadoop.mapred.lib.NLineInputFormat -->
  11186. <class name="NLineInputFormat" extends="org.apache.hadoop.mapred.FileInputFormat"
  11187. abstract="false"
  11188. static="false" final="false" visibility="public"
  11189. deprecated="Use
  11190. {@link org.apache.hadoop.mapreduce.lib.input.NLineInputFormat} instead">
  11191. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  11192. <constructor name="NLineInputFormat"
  11193. static="false" final="false" visibility="public"
  11194. deprecated="not deprecated">
  11195. </constructor>
  11196. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  11197. abstract="false" native="false" synchronized="false"
  11198. static="false" final="false" visibility="public"
  11199. deprecated="not deprecated">
  11200. <param name="genericSplit" type="org.apache.hadoop.mapred.InputSplit"/>
  11201. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11202. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11203. <exception name="IOException" type="java.io.IOException"/>
  11204. </method>
  11205. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  11206. abstract="false" native="false" synchronized="false"
  11207. static="false" final="false" visibility="public"
  11208. deprecated="not deprecated">
  11209. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11210. <param name="numSplits" type="int"/>
  11211. <exception name="IOException" type="java.io.IOException"/>
  11212. <doc>
  11213. <![CDATA[Logically splits the set of input files for the job, splits N lines
  11214. of the input as one split.
  11215. @see org.apache.hadoop.mapred.FileInputFormat#getSplits(JobConf, int)]]>
  11216. </doc>
  11217. </method>
  11218. <method name="configure"
  11219. abstract="false" native="false" synchronized="false"
  11220. static="false" final="false" visibility="public"
  11221. deprecated="not deprecated">
  11222. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  11223. </method>
  11224. <doc>
  11225. <![CDATA[NLineInputFormat which splits N lines of input as one split.
  11226. In many "pleasantly" parallel applications, each process/mapper
  11227. processes the same input file(s), but with computations
  11228. controlled by different parameters (referred to as "parameter sweeps").
  11229. One way to achieve this, is to specify a set of parameters
  11230. (one set per line) as input in a control file
  11231. (which is the input path to the map-reduce application,
  11232. whereas the input dataset is specified
  11233. via a config variable in JobConf).
  11234. The NLineInputFormat can be used in such applications; it splits
  11235. the input file such that, by default, one line is fed as
  11236. a value to one map task, and the key is the offset.
  11237. i.e. (k,v) is (LongWritable, Text).
  11238. The location hints will span the whole mapred cluster.
  11239. @deprecated Use
  11240. {@link org.apache.hadoop.mapreduce.lib.input.NLineInputFormat} instead]]>
  11241. </doc>
  11242. </class>
  11243. <!-- end class org.apache.hadoop.mapred.lib.NLineInputFormat -->
  11244. <!-- start class org.apache.hadoop.mapred.lib.NullOutputFormat -->
  11245. <class name="NullOutputFormat" extends="java.lang.Object"
  11246. abstract="false"
  11247. static="false" final="false" visibility="public"
  11248. deprecated="Use
  11249. {@link org.apache.hadoop.mapreduce.lib.output.NullOutputFormat} instead.">
  11250. <implements name="org.apache.hadoop.mapred.OutputFormat"/>
  11251. <constructor name="NullOutputFormat"
  11252. static="false" final="false" visibility="public"
  11253. deprecated="not deprecated">
  11254. </constructor>
  11255. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  11256. abstract="false" native="false" synchronized="false"
  11257. static="false" final="false" visibility="public"
  11258. deprecated="not deprecated">
  11259. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  11260. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11261. <param name="name" type="java.lang.String"/>
  11262. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  11263. </method>
  11264. <method name="checkOutputSpecs"
  11265. abstract="false" native="false" synchronized="false"
  11266. static="false" final="false" visibility="public"
  11267. deprecated="not deprecated">
  11268. <param name="ignored" type="org.apache.hadoop.fs.FileSystem"/>
  11269. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11270. </method>
  11271. <doc>
  11272. <![CDATA[Consume all outputs and put them in /dev/null.
  11273. @deprecated Use
  11274. {@link org.apache.hadoop.mapreduce.lib.output.NullOutputFormat} instead.]]>
  11275. </doc>
  11276. </class>
  11277. <!-- end class org.apache.hadoop.mapred.lib.NullOutputFormat -->
  11278. <!-- start class org.apache.hadoop.mapred.lib.RegexMapper -->
  11279. <class name="RegexMapper" extends="org.apache.hadoop.mapred.MapReduceBase"
  11280. abstract="false"
  11281. static="false" final="false" visibility="public"
  11282. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.map.RegexMapper}">
  11283. <implements name="org.apache.hadoop.mapred.Mapper"/>
  11284. <constructor name="RegexMapper"
  11285. static="false" final="false" visibility="public"
  11286. deprecated="not deprecated">
  11287. </constructor>
  11288. <method name="configure"
  11289. abstract="false" native="false" synchronized="false"
  11290. static="false" final="false" visibility="public"
  11291. deprecated="not deprecated">
  11292. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11293. </method>
  11294. <method name="map"
  11295. abstract="false" native="false" synchronized="false"
  11296. static="false" final="false" visibility="public"
  11297. deprecated="not deprecated">
  11298. <param name="key" type="K"/>
  11299. <param name="value" type="org.apache.hadoop.io.Text"/>
  11300. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  11301. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11302. <exception name="IOException" type="java.io.IOException"/>
  11303. </method>
  11304. <doc>
  11305. <![CDATA[A {@link Mapper} that extracts text matching a regular expression.
  11306. @deprecated Use {@link org.apache.hadoop.mapreduce.lib.map.RegexMapper}]]>
  11307. </doc>
  11308. </class>
  11309. <!-- end class org.apache.hadoop.mapred.lib.RegexMapper -->
  11310. <!-- start class org.apache.hadoop.mapred.lib.TokenCountMapper -->
  11311. <class name="TokenCountMapper" extends="org.apache.hadoop.mapred.MapReduceBase"
  11312. abstract="false"
  11313. static="false" final="false" visibility="public"
  11314. deprecated="Use
  11315. {@link org.apache.hadoop.mapreduce.lib.map.TokenCounterMapper} instead.">
  11316. <implements name="org.apache.hadoop.mapred.Mapper"/>
  11317. <constructor name="TokenCountMapper"
  11318. static="false" final="false" visibility="public"
  11319. deprecated="not deprecated">
  11320. </constructor>
  11321. <method name="map"
  11322. abstract="false" native="false" synchronized="false"
  11323. static="false" final="false" visibility="public"
  11324. deprecated="not deprecated">
  11325. <param name="key" type="K"/>
  11326. <param name="value" type="org.apache.hadoop.io.Text"/>
  11327. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  11328. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11329. <exception name="IOException" type="java.io.IOException"/>
  11330. </method>
  11331. <doc>
  11332. <![CDATA[A {@link Mapper} that maps text values into <token,freq> pairs. Uses
  11333. {@link StringTokenizer} to break text into tokens.
  11334. @deprecated Use
  11335. {@link org.apache.hadoop.mapreduce.lib.map.TokenCounterMapper} instead.]]>
  11336. </doc>
  11337. </class>
  11338. <!-- end class org.apache.hadoop.mapred.lib.TokenCountMapper -->
  11339. <!-- start class org.apache.hadoop.mapred.lib.TotalOrderPartitioner -->
  11340. <class name="TotalOrderPartitioner" extends="org.apache.hadoop.mapreduce.lib.partition.TotalOrderPartitioner"
  11341. abstract="false"
  11342. static="false" final="false" visibility="public"
  11343. deprecated="Use
  11344. {@link org.apache.hadoop.mapreduce.lib.partition.TotalOrderPartitioner}">
  11345. <implements name="org.apache.hadoop.mapred.Partitioner"/>
  11346. <constructor name="TotalOrderPartitioner"
  11347. static="false" final="false" visibility="public"
  11348. deprecated="not deprecated">
  11349. </constructor>
  11350. <method name="configure"
  11351. abstract="false" native="false" synchronized="false"
  11352. static="false" final="false" visibility="public"
  11353. deprecated="not deprecated">
  11354. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11355. </method>
  11356. <doc>
  11357. <![CDATA[Partitioner effecting a total order by reading split points from
  11358. an externally generated source.
  11359. @deprecated Use
  11360. {@link org.apache.hadoop.mapreduce.lib.partition.TotalOrderPartitioner}]]>
  11361. </doc>
  11362. </class>
  11363. <!-- end class org.apache.hadoop.mapred.lib.TotalOrderPartitioner -->
  11364. </package>
  11365. <package name="org.apache.hadoop.mapred.lib.aggregate">
  11366. <!-- start class org.apache.hadoop.mapred.lib.aggregate.DoubleValueSum -->
  11367. <class name="DoubleValueSum" extends="org.apache.hadoop.mapreduce.lib.aggregate.DoubleValueSum"
  11368. abstract="false"
  11369. static="false" final="false" visibility="public"
  11370. deprecated="Use
  11371. {@link org.apache.hadoop.mapreduce.lib.aggregate.DoubleValueSum} instead">
  11372. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11373. <constructor name="DoubleValueSum"
  11374. static="false" final="false" visibility="public"
  11375. deprecated="not deprecated">
  11376. </constructor>
  11377. <doc>
  11378. <![CDATA[This class implements a value aggregator that sums up a sequence of double
  11379. values.
  11380. @deprecated Use
  11381. {@link org.apache.hadoop.mapreduce.lib.aggregate.DoubleValueSum} instead]]>
  11382. </doc>
  11383. </class>
  11384. <!-- end class org.apache.hadoop.mapred.lib.aggregate.DoubleValueSum -->
  11385. <!-- start class org.apache.hadoop.mapred.lib.aggregate.LongValueMax -->
  11386. <class name="LongValueMax" extends="org.apache.hadoop.mapreduce.lib.aggregate.LongValueMax"
  11387. abstract="false"
  11388. static="false" final="false" visibility="public"
  11389. deprecated="Use
  11390. {@link org.apache.hadoop.mapreduce.lib.aggregate.LongValueMax} instead">
  11391. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11392. <constructor name="LongValueMax"
  11393. static="false" final="false" visibility="public"
  11394. deprecated="not deprecated">
  11395. </constructor>
  11396. <doc>
  11397. <![CDATA[This class implements a value aggregator that maintains the maximum of
  11398. a sequence of long values.
  11399. @deprecated Use
  11400. {@link org.apache.hadoop.mapreduce.lib.aggregate.LongValueMax} instead]]>
  11401. </doc>
  11402. </class>
  11403. <!-- end class org.apache.hadoop.mapred.lib.aggregate.LongValueMax -->
  11404. <!-- start class org.apache.hadoop.mapred.lib.aggregate.LongValueMin -->
  11405. <class name="LongValueMin" extends="org.apache.hadoop.mapreduce.lib.aggregate.LongValueMin"
  11406. abstract="false"
  11407. static="false" final="false" visibility="public"
  11408. deprecated="Use
  11409. {@link org.apache.hadoop.mapreduce.lib.aggregate.LongValueMin} instead">
  11410. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11411. <constructor name="LongValueMin"
  11412. static="false" final="false" visibility="public"
  11413. deprecated="not deprecated">
  11414. </constructor>
  11415. <doc>
  11416. <![CDATA[This class implements a value aggregator that maintains the minimum of
  11417. a sequence of long values.
  11418. @deprecated Use
  11419. {@link org.apache.hadoop.mapreduce.lib.aggregate.LongValueMin} instead]]>
  11420. </doc>
  11421. </class>
  11422. <!-- end class org.apache.hadoop.mapred.lib.aggregate.LongValueMin -->
  11423. <!-- start class org.apache.hadoop.mapred.lib.aggregate.LongValueSum -->
  11424. <class name="LongValueSum" extends="org.apache.hadoop.mapreduce.lib.aggregate.LongValueSum"
  11425. abstract="false"
  11426. static="false" final="false" visibility="public"
  11427. deprecated="Use
  11428. {@link org.apache.hadoop.mapreduce.lib.aggregate.LongValueSum} instead">
  11429. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11430. <constructor name="LongValueSum"
  11431. static="false" final="false" visibility="public"
  11432. deprecated="not deprecated">
  11433. </constructor>
  11434. <doc>
  11435. <![CDATA[This class implements a value aggregator that sums up
  11436. a sequence of long values.
  11437. @deprecated Use
  11438. {@link org.apache.hadoop.mapreduce.lib.aggregate.LongValueSum} instead]]>
  11439. </doc>
  11440. </class>
  11441. <!-- end class org.apache.hadoop.mapred.lib.aggregate.LongValueSum -->
  11442. <!-- start class org.apache.hadoop.mapred.lib.aggregate.StringValueMax -->
  11443. <class name="StringValueMax" extends="org.apache.hadoop.mapreduce.lib.aggregate.StringValueMax"
  11444. abstract="false"
  11445. static="false" final="false" visibility="public"
  11446. deprecated="Use
  11447. {@link org.apache.hadoop.mapreduce.lib.aggregate.StringValueMax} instead">
  11448. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11449. <constructor name="StringValueMax"
  11450. static="false" final="false" visibility="public"
  11451. deprecated="not deprecated">
  11452. </constructor>
  11453. <doc>
  11454. <![CDATA[This class implements a value aggregator that maintains the biggest of
  11455. a sequence of strings.
  11456. @deprecated Use
  11457. {@link org.apache.hadoop.mapreduce.lib.aggregate.StringValueMax} instead]]>
  11458. </doc>
  11459. </class>
  11460. <!-- end class org.apache.hadoop.mapred.lib.aggregate.StringValueMax -->
  11461. <!-- start class org.apache.hadoop.mapred.lib.aggregate.StringValueMin -->
  11462. <class name="StringValueMin" extends="org.apache.hadoop.mapreduce.lib.aggregate.StringValueMin"
  11463. abstract="false"
  11464. static="false" final="false" visibility="public"
  11465. deprecated="Use
  11466. {@link org.apache.hadoop.mapreduce.lib.aggregate.StringValueMin} instead">
  11467. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11468. <constructor name="StringValueMin"
  11469. static="false" final="false" visibility="public"
  11470. deprecated="not deprecated">
  11471. </constructor>
  11472. <doc>
  11473. <![CDATA[This class implements a value aggregator that maintains the smallest of
  11474. a sequence of strings.
  11475. @deprecated Use
  11476. {@link org.apache.hadoop.mapreduce.lib.aggregate.StringValueMin} instead]]>
  11477. </doc>
  11478. </class>
  11479. <!-- end class org.apache.hadoop.mapred.lib.aggregate.StringValueMin -->
  11480. <!-- start class org.apache.hadoop.mapred.lib.aggregate.UniqValueCount -->
  11481. <class name="UniqValueCount" extends="org.apache.hadoop.mapreduce.lib.aggregate.UniqValueCount"
  11482. abstract="false"
  11483. static="false" final="false" visibility="public"
  11484. deprecated="Use
  11485. {@link org.apache.hadoop.mapreduce.lib.aggregate.UniqValueCount} instead">
  11486. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  11487. <constructor name="UniqValueCount"
  11488. static="false" final="false" visibility="public"
  11489. deprecated="not deprecated">
  11490. <doc>
  11491. <![CDATA[the default constructor]]>
  11492. </doc>
  11493. </constructor>
  11494. <constructor name="UniqValueCount" type="long"
  11495. static="false" final="false" visibility="public"
  11496. deprecated="not deprecated">
  11497. <doc>
  11498. <![CDATA[constructor
  11499. @param maxNum the limit in the number of unique values to keep.]]>
  11500. </doc>
  11501. </constructor>
  11502. <doc>
  11503. <![CDATA[This class implements a value aggregator that dedupes a sequence of objects.
  11504. @deprecated Use
  11505. {@link org.apache.hadoop.mapreduce.lib.aggregate.UniqValueCount} instead]]>
  11506. </doc>
  11507. </class>
  11508. <!-- end class org.apache.hadoop.mapred.lib.aggregate.UniqValueCount -->
  11509. <!-- start class org.apache.hadoop.mapred.lib.aggregate.UserDefinedValueAggregatorDescriptor -->
  11510. <class name="UserDefinedValueAggregatorDescriptor" extends="org.apache.hadoop.mapreduce.lib.aggregate.UserDefinedValueAggregatorDescriptor"
  11511. abstract="false"
  11512. static="false" final="false" visibility="public"
  11513. deprecated="Use
  11514. {@link org.apache.hadoop.mapreduce.lib.aggregate.UserDefinedValueAggregatorDescriptor}
  11515. instead">
  11516. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorDescriptor"/>
  11517. <constructor name="UserDefinedValueAggregatorDescriptor" type="java.lang.String, org.apache.hadoop.mapred.JobConf"
  11518. static="false" final="false" visibility="public"
  11519. deprecated="not deprecated">
  11520. <doc>
  11521. <![CDATA[@param className the class name of the user defined descriptor class
  11522. @param job a configuration object used for descriptor configuration]]>
  11523. </doc>
  11524. </constructor>
  11525. <method name="createInstance" return="java.lang.Object"
  11526. abstract="false" native="false" synchronized="false"
  11527. static="true" final="false" visibility="public"
  11528. deprecated="not deprecated">
  11529. <param name="className" type="java.lang.String"/>
  11530. <doc>
  11531. <![CDATA[Create an instance of the given class
  11532. @param className the name of the class
  11533. @return a dynamically created instance of the given class]]>
  11534. </doc>
  11535. </method>
  11536. <method name="configure"
  11537. abstract="false" native="false" synchronized="false"
  11538. static="false" final="false" visibility="public"
  11539. deprecated="not deprecated">
  11540. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11541. <doc>
  11542. <![CDATA[Do nothing.]]>
  11543. </doc>
  11544. </method>
  11545. <doc>
  11546. <![CDATA[This class implements a wrapper for a user defined value aggregator descriptor.
  11547. It serves two functions: One is to create an object of ValueAggregatorDescriptor from the
  11548. name of a user defined class that may be dynamically loaded. The other is to
  11549. delegate invocations of generateKeyValPairs function to the created object.
  11550. @deprecated Use
  11551. {@link org.apache.hadoop.mapreduce.lib.aggregate.UserDefinedValueAggregatorDescriptor}
  11552. instead]]>
  11553. </doc>
  11554. </class>
  11555. <!-- end class org.apache.hadoop.mapred.lib.aggregate.UserDefinedValueAggregatorDescriptor -->
  11556. <!-- start interface org.apache.hadoop.mapred.lib.aggregate.ValueAggregator -->
  11557. <interface name="ValueAggregator" abstract="true"
  11558. static="false" final="false" visibility="public"
  11559. deprecated="Use
  11560. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator} instead">
  11561. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  11562. <doc>
  11563. <![CDATA[This interface defines the minimal protocol for value aggregators.
  11564. @deprecated Use
  11565. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator} instead]]>
  11566. </doc>
  11567. </interface>
  11568. <!-- end interface org.apache.hadoop.mapred.lib.aggregate.ValueAggregator -->
  11569. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorBaseDescriptor -->
  11570. <class name="ValueAggregatorBaseDescriptor" extends="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorBaseDescriptor"
  11571. abstract="false"
  11572. static="false" final="false" visibility="public"
  11573. deprecated="Use
  11574. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorBaseDescriptor}
  11575. instead">
  11576. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorDescriptor"/>
  11577. <constructor name="ValueAggregatorBaseDescriptor"
  11578. static="false" final="false" visibility="public"
  11579. deprecated="not deprecated">
  11580. </constructor>
  11581. <method name="generateEntry" return="java.util.Map.Entry"
  11582. abstract="false" native="false" synchronized="false"
  11583. static="true" final="false" visibility="public"
  11584. deprecated="not deprecated">
  11585. <param name="type" type="java.lang.String"/>
  11586. <param name="id" type="java.lang.String"/>
  11587. <param name="val" type="org.apache.hadoop.io.Text"/>
  11588. <doc>
  11589. <![CDATA[@param type the aggregation type
  11590. @param id the aggregation id
  11591. @param val the val associated with the id to be aggregated
  11592. @return an Entry whose key is the aggregation id prefixed with
  11593. the aggregation type.]]>
  11594. </doc>
  11595. </method>
  11596. <method name="generateValueAggregator" return="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"
  11597. abstract="false" native="false" synchronized="false"
  11598. static="true" final="false" visibility="public"
  11599. deprecated="not deprecated">
  11600. <param name="type" type="java.lang.String"/>
  11601. <doc>
  11602. <![CDATA[@param type the aggregation type
  11603. @return a value aggregator of the given type.]]>
  11604. </doc>
  11605. </method>
  11606. <method name="configure"
  11607. abstract="false" native="false" synchronized="false"
  11608. static="false" final="false" visibility="public"
  11609. deprecated="not deprecated">
  11610. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11611. <doc>
  11612. <![CDATA[get the input file name.
  11613. @param job a job configuration object]]>
  11614. </doc>
  11615. </method>
  11616. <field name="UNIQ_VALUE_COUNT" type="java.lang.String"
  11617. transient="false" volatile="false"
  11618. static="true" final="true" visibility="public"
  11619. deprecated="not deprecated">
  11620. </field>
  11621. <field name="LONG_VALUE_SUM" type="java.lang.String"
  11622. transient="false" volatile="false"
  11623. static="true" final="true" visibility="public"
  11624. deprecated="not deprecated">
  11625. </field>
  11626. <field name="DOUBLE_VALUE_SUM" type="java.lang.String"
  11627. transient="false" volatile="false"
  11628. static="true" final="true" visibility="public"
  11629. deprecated="not deprecated">
  11630. </field>
  11631. <field name="VALUE_HISTOGRAM" type="java.lang.String"
  11632. transient="false" volatile="false"
  11633. static="true" final="true" visibility="public"
  11634. deprecated="not deprecated">
  11635. </field>
  11636. <field name="LONG_VALUE_MAX" type="java.lang.String"
  11637. transient="false" volatile="false"
  11638. static="true" final="true" visibility="public"
  11639. deprecated="not deprecated">
  11640. </field>
  11641. <field name="LONG_VALUE_MIN" type="java.lang.String"
  11642. transient="false" volatile="false"
  11643. static="true" final="true" visibility="public"
  11644. deprecated="not deprecated">
  11645. </field>
  11646. <field name="STRING_VALUE_MAX" type="java.lang.String"
  11647. transient="false" volatile="false"
  11648. static="true" final="true" visibility="public"
  11649. deprecated="not deprecated">
  11650. </field>
  11651. <field name="STRING_VALUE_MIN" type="java.lang.String"
  11652. transient="false" volatile="false"
  11653. static="true" final="true" visibility="public"
  11654. deprecated="not deprecated">
  11655. </field>
  11656. <doc>
  11657. <![CDATA[This class implements the common functionalities of
  11658. the subclasses of ValueAggregatorDescriptor class.
  11659. @deprecated Use
  11660. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorBaseDescriptor}
  11661. instead]]>
  11662. </doc>
  11663. </class>
  11664. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorBaseDescriptor -->
  11665. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorCombiner -->
  11666. <class name="ValueAggregatorCombiner" extends="org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJobBase"
  11667. abstract="false"
  11668. static="false" final="false" visibility="public"
  11669. deprecated="Use
  11670. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorCombiner}
  11671. instead">
  11672. <constructor name="ValueAggregatorCombiner"
  11673. static="false" final="false" visibility="public"
  11674. deprecated="not deprecated">
  11675. </constructor>
  11676. <method name="configure"
  11677. abstract="false" native="false" synchronized="false"
  11678. static="false" final="false" visibility="public"
  11679. deprecated="not deprecated">
  11680. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11681. <doc>
  11682. <![CDATA[Combiner does not need to configure.]]>
  11683. </doc>
  11684. </method>
  11685. <method name="reduce"
  11686. abstract="false" native="false" synchronized="false"
  11687. static="false" final="false" visibility="public"
  11688. deprecated="not deprecated">
  11689. <param name="key" type="org.apache.hadoop.io.Text"/>
  11690. <param name="values" type="java.util.Iterator"/>
  11691. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  11692. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11693. <exception name="IOException" type="java.io.IOException"/>
  11694. <doc>
  11695. <![CDATA[Combines values for a given key.
  11696. @param key the key is expected to be a Text object, whose prefix indicates
  11697. the type of aggregation to aggregate the values.
  11698. @param values the values to combine
  11699. @param output to collect combined values]]>
  11700. </doc>
  11701. </method>
  11702. <method name="close"
  11703. abstract="false" native="false" synchronized="false"
  11704. static="false" final="false" visibility="public"
  11705. deprecated="not deprecated">
  11706. <exception name="IOException" type="java.io.IOException"/>
  11707. <doc>
  11708. <![CDATA[Do nothing.]]>
  11709. </doc>
  11710. </method>
  11711. <method name="map"
  11712. abstract="false" native="false" synchronized="false"
  11713. static="false" final="false" visibility="public"
  11714. deprecated="not deprecated">
  11715. <param name="arg0" type="K1"/>
  11716. <param name="arg1" type="V1"/>
  11717. <param name="arg2" type="org.apache.hadoop.mapred.OutputCollector"/>
  11718. <param name="arg3" type="org.apache.hadoop.mapred.Reporter"/>
  11719. <exception name="IOException" type="java.io.IOException"/>
  11720. <doc>
  11721. <![CDATA[Do nothing. Should not be called.]]>
  11722. </doc>
  11723. </method>
  11724. <doc>
  11725. <![CDATA[This class implements the generic combiner of Aggregate.
  11726. @deprecated Use
  11727. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorCombiner}
  11728. instead]]>
  11729. </doc>
  11730. </class>
  11731. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorCombiner -->
  11732. <!-- start interface org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorDescriptor -->
  11733. <interface name="ValueAggregatorDescriptor" abstract="true"
  11734. static="false" final="false" visibility="public"
  11735. deprecated="Use
  11736. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor}
  11737. instead">
  11738. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor"/>
  11739. <method name="configure"
  11740. abstract="false" native="false" synchronized="false"
  11741. static="false" final="false" visibility="public"
  11742. deprecated="not deprecated">
  11743. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11744. <doc>
  11745. <![CDATA[Configure the object
  11746. @param job
  11747. a JobConf object that may contain the information that can be used
  11748. to configure the object.]]>
  11749. </doc>
  11750. </method>
  11751. <field name="TYPE_SEPARATOR" type="java.lang.String"
  11752. transient="false" volatile="false"
  11753. static="true" final="true" visibility="public"
  11754. deprecated="not deprecated">
  11755. </field>
  11756. <field name="ONE" type="org.apache.hadoop.io.Text"
  11757. transient="false" volatile="false"
  11758. static="true" final="true" visibility="public"
  11759. deprecated="not deprecated">
  11760. </field>
  11761. <doc>
  11762. <![CDATA[This interface defines the contract a value aggregator descriptor must
  11763. support. Such a descriptor can be configured with a JobConf object. Its main
  11764. function is to generate a list of aggregation-id/value pairs. An aggregation
  11765. id encodes an aggregation type which is used to guide the way to aggregate
  11766. the value in the reduce/combiner phase of an Aggregate based job. The mapper in
  11767. an Aggregate based map/reduce job may create one or more of
  11768. ValueAggregatorDescriptor objects at configuration time. For each input
  11769. key/value pair, the mapper will use those objects to create aggregation
  11770. id/value pairs.
  11771. @deprecated Use
  11772. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor}
  11773. instead]]>
  11774. </doc>
  11775. </interface>
  11776. <!-- end interface org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorDescriptor -->
  11777. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJob -->
  11778. <class name="ValueAggregatorJob" extends="java.lang.Object"
  11779. abstract="false"
  11780. static="false" final="false" visibility="public"
  11781. deprecated="Use
  11782. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJob} instead">
  11783. <constructor name="ValueAggregatorJob"
  11784. static="false" final="false" visibility="public"
  11785. deprecated="not deprecated">
  11786. </constructor>
  11787. <method name="createValueAggregatorJobs" return="org.apache.hadoop.mapred.jobcontrol.JobControl"
  11788. abstract="false" native="false" synchronized="false"
  11789. static="true" final="false" visibility="public"
  11790. deprecated="not deprecated">
  11791. <param name="args" type="java.lang.String[]"/>
  11792. <param name="descriptors" type="java.lang.Class[]"/>
  11793. <exception name="IOException" type="java.io.IOException"/>
  11794. </method>
  11795. <method name="createValueAggregatorJobs" return="org.apache.hadoop.mapred.jobcontrol.JobControl"
  11796. abstract="false" native="false" synchronized="false"
  11797. static="true" final="false" visibility="public"
  11798. deprecated="not deprecated">
  11799. <param name="args" type="java.lang.String[]"/>
  11800. <exception name="IOException" type="java.io.IOException"/>
  11801. </method>
  11802. <method name="createValueAggregatorJob" return="org.apache.hadoop.mapred.JobConf"
  11803. abstract="false" native="false" synchronized="false"
  11804. static="true" final="false" visibility="public"
  11805. deprecated="not deprecated">
  11806. <param name="args" type="java.lang.String[]"/>
  11807. <exception name="IOException" type="java.io.IOException"/>
  11808. <doc>
  11809. <![CDATA[Create an Aggregate based map/reduce job.
  11810. @param args the arguments used for job creation. Generic hadoop
  11811. arguments are accepted.
  11812. @return a JobConf object ready for submission.
  11813. @throws IOException
  11814. @see GenericOptionsParser]]>
  11815. </doc>
  11816. </method>
  11817. <method name="createValueAggregatorJob" return="org.apache.hadoop.mapred.JobConf"
  11818. abstract="false" native="false" synchronized="false"
  11819. static="true" final="false" visibility="public"
  11820. deprecated="not deprecated">
  11821. <param name="args" type="java.lang.String[]"/>
  11822. <param name="descriptors" type="java.lang.Class[]"/>
  11823. <exception name="IOException" type="java.io.IOException"/>
  11824. </method>
  11825. <method name="setAggregatorDescriptors"
  11826. abstract="false" native="false" synchronized="false"
  11827. static="true" final="false" visibility="public"
  11828. deprecated="not deprecated">
  11829. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11830. <param name="descriptors" type="java.lang.Class[]"/>
  11831. </method>
  11832. <method name="main"
  11833. abstract="false" native="false" synchronized="false"
  11834. static="true" final="false" visibility="public"
  11835. deprecated="not deprecated">
  11836. <param name="args" type="java.lang.String[]"/>
  11837. <exception name="IOException" type="java.io.IOException"/>
  11838. <doc>
  11839. <![CDATA[create and run an Aggregate based map/reduce job.
  11840. @param args the arguments used for job creation
  11841. @throws IOException]]>
  11842. </doc>
  11843. </method>
  11844. <doc>
  11845. <![CDATA[This is the main class for creating a map/reduce job using Aggregate
  11846. framework. The Aggregate is a specialization of map/reduce framework,
  11847. specializing for performing various simple aggregations.
  11848. Generally speaking, in order to implement an application using Map/Reduce
  11849. model, the developer is to implement Map and Reduce functions (and possibly
  11850. combine function). However, a lot of applications related to counting and
  11851. statistics computing have very similar characteristics. Aggregate abstracts
  11852. out the general patterns of these functions and implements those patterns.
  11853. In particular, the package provides generic mapper/reducer/combiner classes,
  11854. and a set of built-in value aggregators, and a generic utility class that
  11855. helps user create map/reduce jobs using the generic class. The built-in
  11856. aggregators include:
  11857. sum over numeric values count the number of distinct values compute the
  11858. histogram of values compute the minimum, maximum, median, average, standard
  11859. deviation of numeric values
  11860. The developer using Aggregate will need only to provide a plugin class
  11861. conforming to the following interface:
  11862. public interface ValueAggregatorDescriptor { public ArrayList<Entry>
  11863. generateKeyValPairs(Object key, Object value); public void
  11864. configure(JobConf job); }
  11865. The package also provides a base class, ValueAggregatorBaseDescriptor,
  11866. implementing the above interface. The user can extend the base class and
  11867. implement generateKeyValPairs accordingly.
  11868. The primary work of generateKeyValPairs is to emit one or more key/value
  11869. pairs based on the input key/value pair. The key in an output key/value pair
  11870. encode two pieces of information: aggregation type and aggregation id. The
  11871. value will be aggregated onto the aggregation id according to the aggregation
  11872. type.
  11873. This class offers a function to generate a map/reduce job using Aggregate
  11874. framework. The function takes the following parameters: input directory spec
  11875. input format (text or sequence file) output directory a file specifying the
  11876. user plugin class
  11877. @deprecated Use
  11878. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJob} instead]]>
  11879. </doc>
  11880. </class>
  11881. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJob -->
  11882. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJobBase -->
  11883. <class name="ValueAggregatorJobBase" extends="java.lang.Object"
  11884. abstract="true"
  11885. static="false" final="false" visibility="public"
  11886. deprecated="Use
  11887. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJobBase}
  11888. instead">
  11889. <implements name="org.apache.hadoop.mapred.Mapper"/>
  11890. <implements name="org.apache.hadoop.mapred.Reducer"/>
  11891. <constructor name="ValueAggregatorJobBase"
  11892. static="false" final="false" visibility="public"
  11893. deprecated="not deprecated">
  11894. </constructor>
  11895. <method name="configure"
  11896. abstract="false" native="false" synchronized="false"
  11897. static="false" final="false" visibility="public"
  11898. deprecated="not deprecated">
  11899. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  11900. </method>
  11901. <method name="logSpec"
  11902. abstract="false" native="false" synchronized="false"
  11903. static="false" final="false" visibility="protected"
  11904. deprecated="not deprecated">
  11905. </method>
  11906. <method name="close"
  11907. abstract="false" native="false" synchronized="false"
  11908. static="false" final="false" visibility="public"
  11909. deprecated="not deprecated">
  11910. <exception name="IOException" type="java.io.IOException"/>
  11911. </method>
  11912. <field name="aggregatorDescriptorList" type="java.util.ArrayList"
  11913. transient="false" volatile="false"
  11914. static="false" final="false" visibility="protected"
  11915. deprecated="not deprecated">
  11916. </field>
  11917. <doc>
  11918. <![CDATA[This abstract class implements some common functionalities of the
  11919. generic mapper, reducer and combiner classes of Aggregate.
  11920. @deprecated Use
  11921. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJobBase}
  11922. instead]]>
  11923. </doc>
  11924. </class>
  11925. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJobBase -->
  11926. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorMapper -->
  11927. <class name="ValueAggregatorMapper" extends="org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJobBase"
  11928. abstract="false"
  11929. static="false" final="false" visibility="public"
  11930. deprecated="Use
  11931. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorMapper}
  11932. instead">
  11933. <constructor name="ValueAggregatorMapper"
  11934. static="false" final="false" visibility="public"
  11935. deprecated="not deprecated">
  11936. </constructor>
  11937. <method name="map"
  11938. abstract="false" native="false" synchronized="false"
  11939. static="false" final="false" visibility="public"
  11940. deprecated="not deprecated">
  11941. <param name="key" type="K1"/>
  11942. <param name="value" type="V1"/>
  11943. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  11944. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11945. <exception name="IOException" type="java.io.IOException"/>
  11946. <doc>
  11947. <![CDATA[the map function. It iterates through the value aggregator descriptor
  11948. list to generate aggregation id/value pairs and emit them.]]>
  11949. </doc>
  11950. </method>
  11951. <method name="reduce"
  11952. abstract="false" native="false" synchronized="false"
  11953. static="false" final="false" visibility="public"
  11954. deprecated="not deprecated">
  11955. <param name="arg0" type="org.apache.hadoop.io.Text"/>
  11956. <param name="arg1" type="java.util.Iterator"/>
  11957. <param name="arg2" type="org.apache.hadoop.mapred.OutputCollector"/>
  11958. <param name="arg3" type="org.apache.hadoop.mapred.Reporter"/>
  11959. <exception name="IOException" type="java.io.IOException"/>
  11960. <doc>
  11961. <![CDATA[Do nothing. Should not be called.]]>
  11962. </doc>
  11963. </method>
  11964. <doc>
  11965. <![CDATA[This class implements the generic mapper of Aggregate.
  11966. @deprecated Use
  11967. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorMapper}
  11968. instead]]>
  11969. </doc>
  11970. </class>
  11971. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorMapper -->
  11972. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorReducer -->
  11973. <class name="ValueAggregatorReducer" extends="org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorJobBase"
  11974. abstract="false"
  11975. static="false" final="false" visibility="public"
  11976. deprecated="Use
  11977. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorReducer}
  11978. instead">
  11979. <constructor name="ValueAggregatorReducer"
  11980. static="false" final="false" visibility="public"
  11981. deprecated="not deprecated">
  11982. </constructor>
  11983. <method name="reduce"
  11984. abstract="false" native="false" synchronized="false"
  11985. static="false" final="false" visibility="public"
  11986. deprecated="not deprecated">
  11987. <param name="key" type="org.apache.hadoop.io.Text"/>
  11988. <param name="values" type="java.util.Iterator"/>
  11989. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  11990. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  11991. <exception name="IOException" type="java.io.IOException"/>
  11992. <doc>
  11993. <![CDATA[@param key
  11994. the key is expected to be a Text object, whose prefix indicates
  11995. the type of aggregation to aggregate the values. In effect, data
  11996. driven computing is achieved. It is assumed that each aggregator's
  11997. getReport method emits appropriate output for the aggregator. This
  11998. may be further customized.
  11999. @param values the values to be aggregated]]>
  12000. </doc>
  12001. </method>
  12002. <method name="map"
  12003. abstract="false" native="false" synchronized="false"
  12004. static="false" final="false" visibility="public"
  12005. deprecated="not deprecated">
  12006. <param name="arg0" type="K1"/>
  12007. <param name="arg1" type="V1"/>
  12008. <param name="arg2" type="org.apache.hadoop.mapred.OutputCollector"/>
  12009. <param name="arg3" type="org.apache.hadoop.mapred.Reporter"/>
  12010. <exception name="IOException" type="java.io.IOException"/>
  12011. <doc>
  12012. <![CDATA[Do nothing. Should not be called]]>
  12013. </doc>
  12014. </method>
  12015. <doc>
  12016. <![CDATA[This class implements the generic reducer of Aggregate.
  12017. @deprecated Use
  12018. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorReducer}
  12019. instead]]>
  12020. </doc>
  12021. </class>
  12022. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueAggregatorReducer -->
  12023. <!-- start class org.apache.hadoop.mapred.lib.aggregate.ValueHistogram -->
  12024. <class name="ValueHistogram" extends="org.apache.hadoop.mapreduce.lib.aggregate.ValueHistogram"
  12025. abstract="false"
  12026. static="false" final="false" visibility="public"
  12027. deprecated="Use
  12028. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueHistogram} instead">
  12029. <implements name="org.apache.hadoop.mapred.lib.aggregate.ValueAggregator"/>
  12030. <constructor name="ValueHistogram"
  12031. static="false" final="false" visibility="public"
  12032. deprecated="not deprecated">
  12033. </constructor>
  12034. <doc>
  12035. <![CDATA[This class implements a value aggregator that computes the
  12036. histogram of a sequence of strings.
  12037. @deprecated Use
  12038. {@link org.apache.hadoop.mapreduce.lib.aggregate.ValueHistogram} instead]]>
  12039. </doc>
  12040. </class>
  12041. <!-- end class org.apache.hadoop.mapred.lib.aggregate.ValueHistogram -->
  12042. </package>
  12043. <package name="org.apache.hadoop.mapred.lib.db">
  12044. <!-- start class org.apache.hadoop.mapred.lib.db.DBConfiguration -->
  12045. <class name="DBConfiguration" extends="org.apache.hadoop.mapreduce.lib.db.DBConfiguration"
  12046. abstract="false"
  12047. static="false" final="false" visibility="public"
  12048. deprecated="Use
  12049. {@link org.apache.hadoop.mapreduce.lib.db.DBConfiguration} instead">
  12050. <method name="configureDB"
  12051. abstract="false" native="false" synchronized="false"
  12052. static="true" final="false" visibility="public"
  12053. deprecated="not deprecated">
  12054. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12055. <param name="driverClass" type="java.lang.String"/>
  12056. <param name="dbUrl" type="java.lang.String"/>
  12057. <param name="userName" type="java.lang.String"/>
  12058. <param name="passwd" type="java.lang.String"/>
  12059. <doc>
  12060. <![CDATA[Sets the DB access related fields in the JobConf.
  12061. @param job the job
  12062. @param driverClass JDBC Driver class name
  12063. @param dbUrl JDBC DB access URL.
  12064. @param userName DB access username
  12065. @param passwd DB access passwd]]>
  12066. </doc>
  12067. </method>
  12068. <method name="configureDB"
  12069. abstract="false" native="false" synchronized="false"
  12070. static="true" final="false" visibility="public"
  12071. deprecated="not deprecated">
  12072. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12073. <param name="driverClass" type="java.lang.String"/>
  12074. <param name="dbUrl" type="java.lang.String"/>
  12075. <doc>
  12076. <![CDATA[Sets the DB access related fields in the JobConf.
  12077. @param job the job
  12078. @param driverClass JDBC Driver class name
  12079. @param dbUrl JDBC DB access URL.]]>
  12080. </doc>
  12081. </method>
  12082. <field name="DRIVER_CLASS_PROPERTY" type="java.lang.String"
  12083. transient="false" volatile="false"
  12084. static="true" final="true" visibility="public"
  12085. deprecated="not deprecated">
  12086. <doc>
  12087. <![CDATA[The JDBC Driver class name]]>
  12088. </doc>
  12089. </field>
  12090. <field name="URL_PROPERTY" type="java.lang.String"
  12091. transient="false" volatile="false"
  12092. static="true" final="true" visibility="public"
  12093. deprecated="not deprecated">
  12094. <doc>
  12095. <![CDATA[JDBC Database access URL]]>
  12096. </doc>
  12097. </field>
  12098. <field name="USERNAME_PROPERTY" type="java.lang.String"
  12099. transient="false" volatile="false"
  12100. static="true" final="true" visibility="public"
  12101. deprecated="not deprecated">
  12102. <doc>
  12103. <![CDATA[User name to access the database]]>
  12104. </doc>
  12105. </field>
  12106. <field name="PASSWORD_PROPERTY" type="java.lang.String"
  12107. transient="false" volatile="false"
  12108. static="true" final="true" visibility="public"
  12109. deprecated="not deprecated">
  12110. <doc>
  12111. <![CDATA[Password to access the database]]>
  12112. </doc>
  12113. </field>
  12114. <field name="INPUT_TABLE_NAME_PROPERTY" type="java.lang.String"
  12115. transient="false" volatile="false"
  12116. static="true" final="true" visibility="public"
  12117. deprecated="not deprecated">
  12118. <doc>
  12119. <![CDATA[Input table name]]>
  12120. </doc>
  12121. </field>
  12122. <field name="INPUT_FIELD_NAMES_PROPERTY" type="java.lang.String"
  12123. transient="false" volatile="false"
  12124. static="true" final="true" visibility="public"
  12125. deprecated="not deprecated">
  12126. <doc>
  12127. <![CDATA[Field names in the Input table]]>
  12128. </doc>
  12129. </field>
  12130. <field name="INPUT_CONDITIONS_PROPERTY" type="java.lang.String"
  12131. transient="false" volatile="false"
  12132. static="true" final="true" visibility="public"
  12133. deprecated="not deprecated">
  12134. <doc>
  12135. <![CDATA[WHERE clause in the input SELECT statement]]>
  12136. </doc>
  12137. </field>
  12138. <field name="INPUT_ORDER_BY_PROPERTY" type="java.lang.String"
  12139. transient="false" volatile="false"
  12140. static="true" final="true" visibility="public"
  12141. deprecated="not deprecated">
  12142. <doc>
  12143. <![CDATA[ORDER BY clause in the input SELECT statement]]>
  12144. </doc>
  12145. </field>
  12146. <field name="INPUT_QUERY" type="java.lang.String"
  12147. transient="false" volatile="false"
  12148. static="true" final="true" visibility="public"
  12149. deprecated="not deprecated">
  12150. <doc>
  12151. <![CDATA[Whole input query, excluding LIMIT...OFFSET]]>
  12152. </doc>
  12153. </field>
  12154. <field name="INPUT_COUNT_QUERY" type="java.lang.String"
  12155. transient="false" volatile="false"
  12156. static="true" final="true" visibility="public"
  12157. deprecated="not deprecated">
  12158. <doc>
  12159. <![CDATA[Input query to get the count of records]]>
  12160. </doc>
  12161. </field>
  12162. <field name="INPUT_CLASS_PROPERTY" type="java.lang.String"
  12163. transient="false" volatile="false"
  12164. static="true" final="true" visibility="public"
  12165. deprecated="not deprecated">
  12166. <doc>
  12167. <![CDATA[Class name implementing DBWritable which will hold input tuples]]>
  12168. </doc>
  12169. </field>
  12170. <field name="OUTPUT_TABLE_NAME_PROPERTY" type="java.lang.String"
  12171. transient="false" volatile="false"
  12172. static="true" final="true" visibility="public"
  12173. deprecated="not deprecated">
  12174. <doc>
  12175. <![CDATA[Output table name]]>
  12176. </doc>
  12177. </field>
  12178. <field name="OUTPUT_FIELD_NAMES_PROPERTY" type="java.lang.String"
  12179. transient="false" volatile="false"
  12180. static="true" final="true" visibility="public"
  12181. deprecated="not deprecated">
  12182. <doc>
  12183. <![CDATA[Field names in the Output table]]>
  12184. </doc>
  12185. </field>
  12186. <field name="OUTPUT_FIELD_COUNT_PROPERTY" type="java.lang.String"
  12187. transient="false" volatile="false"
  12188. static="true" final="true" visibility="public"
  12189. deprecated="not deprecated">
  12190. <doc>
  12191. <![CDATA[Number of fields in the Output table]]>
  12192. </doc>
  12193. </field>
  12194. <doc>
  12195. <![CDATA[@deprecated Use
  12196. {@link org.apache.hadoop.mapreduce.lib.db.DBConfiguration} instead]]>
  12197. </doc>
  12198. </class>
  12199. <!-- end class org.apache.hadoop.mapred.lib.db.DBConfiguration -->
  12200. <!-- start class org.apache.hadoop.mapred.lib.db.DBInputFormat -->
  12201. <class name="DBInputFormat" extends="org.apache.hadoop.mapreduce.lib.db.DBInputFormat"
  12202. abstract="false"
  12203. static="false" final="false" visibility="public"
  12204. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.db.DBInputFormat} instead.">
  12205. <implements name="org.apache.hadoop.mapred.InputFormat"/>
  12206. <implements name="org.apache.hadoop.mapred.JobConfigurable"/>
  12207. <constructor name="DBInputFormat"
  12208. static="false" final="false" visibility="public"
  12209. deprecated="not deprecated">
  12210. </constructor>
  12211. <method name="configure"
  12212. abstract="false" native="false" synchronized="false"
  12213. static="false" final="false" visibility="public"
  12214. deprecated="not deprecated">
  12215. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12216. <doc>
  12217. <![CDATA[{@inheritDoc}]]>
  12218. </doc>
  12219. </method>
  12220. <method name="getRecordReader" return="org.apache.hadoop.mapred.RecordReader"
  12221. abstract="false" native="false" synchronized="false"
  12222. static="false" final="false" visibility="public"
  12223. deprecated="not deprecated">
  12224. <param name="split" type="org.apache.hadoop.mapred.InputSplit"/>
  12225. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12226. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  12227. <exception name="IOException" type="java.io.IOException"/>
  12228. <doc>
  12229. <![CDATA[{@inheritDoc}]]>
  12230. </doc>
  12231. </method>
  12232. <method name="getSplits" return="org.apache.hadoop.mapred.InputSplit[]"
  12233. abstract="false" native="false" synchronized="false"
  12234. static="false" final="false" visibility="public"
  12235. deprecated="not deprecated">
  12236. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12237. <param name="chunks" type="int"/>
  12238. <exception name="IOException" type="java.io.IOException"/>
  12239. <doc>
  12240. <![CDATA[{@inheritDoc}]]>
  12241. </doc>
  12242. </method>
  12243. <method name="setInput"
  12244. abstract="false" native="false" synchronized="false"
  12245. static="true" final="false" visibility="public"
  12246. deprecated="not deprecated">
  12247. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12248. <param name="inputClass" type="java.lang.Class"/>
  12249. <param name="tableName" type="java.lang.String"/>
  12250. <param name="conditions" type="java.lang.String"/>
  12251. <param name="orderBy" type="java.lang.String"/>
  12252. <param name="fieldNames" type="java.lang.String[]"/>
  12253. <doc>
  12254. <![CDATA[Initializes the map-part of the job with the appropriate input settings.
  12255. @param job The job
  12256. @param inputClass the class object implementing DBWritable, which is the
  12257. Java object holding tuple fields.
  12258. @param tableName The table to read data from
  12259. @param conditions The condition with which to select data, e.g. '(updated >
  12260. 20070101 AND length > 0)'
  12261. @param orderBy the fieldNames in the orderBy clause.
  12262. @param fieldNames The field names in the table
  12263. @see #setInput(JobConf, Class, String, String)]]>
  12264. </doc>
  12265. </method>
  12266. <method name="setInput"
  12267. abstract="false" native="false" synchronized="false"
  12268. static="true" final="false" visibility="public"
  12269. deprecated="not deprecated">
  12270. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12271. <param name="inputClass" type="java.lang.Class"/>
  12272. <param name="inputQuery" type="java.lang.String"/>
  12273. <param name="inputCountQuery" type="java.lang.String"/>
  12274. <doc>
  12275. <![CDATA[Initializes the map-part of the job with the appropriate input settings.
  12276. @param job The job
  12277. @param inputClass the class object implementing DBWritable, which is the
  12278. Java object holding tuple fields.
  12279. @param inputQuery the input query to select fields. Example :
  12280. "SELECT f1, f2, f3 FROM Mytable ORDER BY f1"
  12281. @param inputCountQuery the input query that returns the number of records in
  12282. the table.
  12283. Example : "SELECT COUNT(f1) FROM Mytable"
  12284. @see #setInput(JobConf, Class, String, String, String, String...)]]>
  12285. </doc>
  12286. </method>
  12287. <doc>
  12288. <![CDATA[@deprecated
  12289. Use {@link org.apache.hadoop.mapreduce.lib.db.DBInputFormat} instead.]]>
  12290. </doc>
  12291. </class>
  12292. <!-- end class org.apache.hadoop.mapred.lib.db.DBInputFormat -->
  12293. <!-- start class org.apache.hadoop.mapred.lib.db.DBInputFormat.DBInputSplit -->
  12294. <class name="DBInputFormat.DBInputSplit" extends="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit"
  12295. abstract="false"
  12296. static="true" final="false" visibility="protected"
  12297. deprecated="not deprecated">
  12298. <implements name="org.apache.hadoop.mapred.InputSplit"/>
  12299. <constructor name="DBInputFormat.DBInputSplit"
  12300. static="false" final="false" visibility="public"
  12301. deprecated="not deprecated">
  12302. <doc>
  12303. <![CDATA[Default Constructor]]>
  12304. </doc>
  12305. </constructor>
  12306. <constructor name="DBInputFormat.DBInputSplit" type="long, long"
  12307. static="false" final="false" visibility="public"
  12308. deprecated="not deprecated">
  12309. <doc>
  12310. <![CDATA[Convenience Constructor
  12311. @param start the index of the first row to select
  12312. @param end the index of the last row to select]]>
  12313. </doc>
  12314. </constructor>
  12315. <doc>
  12316. <![CDATA[An InputSplit that spans a set of rows]]>
  12317. </doc>
  12318. </class>
  12319. <!-- end class org.apache.hadoop.mapred.lib.db.DBInputFormat.DBInputSplit -->
  12320. <!-- start class org.apache.hadoop.mapred.lib.db.DBInputFormat.DBRecordReader -->
  12321. <class name="DBInputFormat.DBRecordReader" extends="org.apache.hadoop.mapreduce.lib.db.DBRecordReader"
  12322. abstract="false"
  12323. static="false" final="false" visibility="protected"
  12324. deprecated="not deprecated">
  12325. <implements name="org.apache.hadoop.mapred.RecordReader"/>
  12326. <constructor name="DBInputFormat.DBRecordReader" type="org.apache.hadoop.mapred.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.mapred.JobConf, java.sql.Connection, org.apache.hadoop.mapred.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String"
  12327. static="false" final="false" visibility="protected"
  12328. deprecated="not deprecated">
  12329. <exception name="SQLException" type="java.sql.SQLException"/>
  12330. <doc>
  12331. <![CDATA[@param split The InputSplit to read data for
  12332. @throws SQLException]]>
  12333. </doc>
  12334. </constructor>
  12335. <method name="createKey" return="org.apache.hadoop.io.LongWritable"
  12336. abstract="false" native="false" synchronized="false"
  12337. static="false" final="false" visibility="public"
  12338. deprecated="not deprecated">
  12339. <doc>
  12340. <![CDATA[{@inheritDoc}]]>
  12341. </doc>
  12342. </method>
  12343. <method name="createValue" return="T"
  12344. abstract="false" native="false" synchronized="false"
  12345. static="false" final="false" visibility="public"
  12346. deprecated="not deprecated">
  12347. <doc>
  12348. <![CDATA[{@inheritDoc}]]>
  12349. </doc>
  12350. </method>
  12351. <method name="getPos" return="long"
  12352. abstract="false" native="false" synchronized="false"
  12353. static="false" final="false" visibility="public"
  12354. deprecated="not deprecated">
  12355. <exception name="IOException" type="java.io.IOException"/>
  12356. </method>
  12357. <method name="next" return="boolean"
  12358. abstract="false" native="false" synchronized="false"
  12359. static="false" final="false" visibility="public"
  12360. deprecated="not deprecated">
  12361. <param name="key" type="org.apache.hadoop.io.LongWritable"/>
  12362. <param name="value" type="T"/>
  12363. <exception name="IOException" type="java.io.IOException"/>
  12364. <doc>
  12365. <![CDATA[{@inheritDoc}]]>
  12366. </doc>
  12367. </method>
  12368. <doc>
  12369. <![CDATA[A RecordReader that reads records from a SQL table.
  12370. Emits LongWritables containing the record number as
  12371. key and DBWritables as value.]]>
  12372. </doc>
  12373. </class>
  12374. <!-- end class org.apache.hadoop.mapred.lib.db.DBInputFormat.DBRecordReader -->
  12375. <!-- start class org.apache.hadoop.mapred.lib.db.DBInputFormat.NullDBWritable -->
  12376. <class name="DBInputFormat.NullDBWritable" extends="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.NullDBWritable"
  12377. abstract="false"
  12378. static="true" final="false" visibility="public"
  12379. deprecated="not deprecated">
  12380. <implements name="org.apache.hadoop.mapred.lib.db.DBWritable"/>
  12381. <implements name="org.apache.hadoop.io.Writable"/>
  12382. <constructor name="DBInputFormat.NullDBWritable"
  12383. static="false" final="false" visibility="public"
  12384. deprecated="not deprecated">
  12385. </constructor>
  12386. <doc>
  12387. <![CDATA[A Class that does nothing, implementing DBWritable]]>
  12388. </doc>
  12389. </class>
  12390. <!-- end class org.apache.hadoop.mapred.lib.db.DBInputFormat.NullDBWritable -->
  12391. <!-- start class org.apache.hadoop.mapred.lib.db.DBOutputFormat -->
  12392. <class name="DBOutputFormat" extends="org.apache.hadoop.mapreduce.lib.db.DBOutputFormat"
  12393. abstract="false"
  12394. static="false" final="false" visibility="public"
  12395. deprecated="Use org.apache.hadoop.mapreduce.lib.db.DBOutputFormat instead">
  12396. <implements name="org.apache.hadoop.mapred.OutputFormat"/>
  12397. <constructor name="DBOutputFormat"
  12398. static="false" final="false" visibility="public"
  12399. deprecated="not deprecated">
  12400. </constructor>
  12401. <method name="checkOutputSpecs"
  12402. abstract="false" native="false" synchronized="false"
  12403. static="false" final="false" visibility="public"
  12404. deprecated="not deprecated">
  12405. <param name="filesystem" type="org.apache.hadoop.fs.FileSystem"/>
  12406. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12407. <exception name="IOException" type="java.io.IOException"/>
  12408. <doc>
  12409. <![CDATA[{@inheritDoc}]]>
  12410. </doc>
  12411. </method>
  12412. <method name="getRecordWriter" return="org.apache.hadoop.mapred.RecordWriter"
  12413. abstract="false" native="false" synchronized="false"
  12414. static="false" final="false" visibility="public"
  12415. deprecated="not deprecated">
  12416. <param name="filesystem" type="org.apache.hadoop.fs.FileSystem"/>
  12417. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12418. <param name="name" type="java.lang.String"/>
  12419. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  12420. <exception name="IOException" type="java.io.IOException"/>
  12421. <doc>
  12422. <![CDATA[{@inheritDoc}]]>
  12423. </doc>
  12424. </method>
  12425. <method name="setOutput"
  12426. abstract="false" native="false" synchronized="false"
  12427. static="true" final="false" visibility="public"
  12428. deprecated="not deprecated">
  12429. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12430. <param name="tableName" type="java.lang.String"/>
  12431. <param name="fieldNames" type="java.lang.String[]"/>
  12432. <doc>
  12433. <![CDATA[Initializes the reduce-part of the job with the appropriate output settings
  12434. @param job The job
  12435. @param tableName The table to insert data into
  12436. @param fieldNames The field names in the table.]]>
  12437. </doc>
  12438. </method>
  12439. <method name="setOutput"
  12440. abstract="false" native="false" synchronized="false"
  12441. static="true" final="false" visibility="public"
  12442. deprecated="not deprecated">
  12443. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  12444. <param name="tableName" type="java.lang.String"/>
  12445. <param name="fieldCount" type="int"/>
  12446. <doc>
  12447. <![CDATA[Initializes the reduce-part of the job with the appropriate output settings
  12448. @param job The job
  12449. @param tableName The table to insert data into
  12450. @param fieldCount the number of fields in the table.]]>
  12451. </doc>
  12452. </method>
  12453. <doc>
  12454. <![CDATA[@deprecated Use org.apache.hadoop.mapreduce.lib.db.DBOutputFormat instead]]>
  12455. </doc>
  12456. </class>
  12457. <!-- end class org.apache.hadoop.mapred.lib.db.DBOutputFormat -->
  12458. <!-- start class org.apache.hadoop.mapred.lib.db.DBOutputFormat.DBRecordWriter -->
  12459. <class name="DBOutputFormat.DBRecordWriter" extends="org.apache.hadoop.mapreduce.lib.db.DBOutputFormat.DBRecordWriter"
  12460. abstract="false"
  12461. static="false" final="false" visibility="protected"
  12462. deprecated="not deprecated">
  12463. <implements name="org.apache.hadoop.mapred.RecordWriter"/>
  12464. <constructor name="DBOutputFormat.DBRecordWriter" type="java.sql.Connection, java.sql.PreparedStatement"
  12465. static="false" final="false" visibility="protected"
  12466. deprecated="not deprecated">
  12467. <exception name="SQLException" type="java.sql.SQLException"/>
  12468. </constructor>
  12469. <method name="close"
  12470. abstract="false" native="false" synchronized="false"
  12471. static="false" final="false" visibility="public"
  12472. deprecated="not deprecated">
  12473. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  12474. <exception name="IOException" type="java.io.IOException"/>
  12475. <doc>
  12476. <![CDATA[{@inheritDoc}]]>
  12477. </doc>
  12478. </method>
  12479. <doc>
  12480. <![CDATA[A RecordWriter that writes the reduce output to a SQL table]]>
  12481. </doc>
  12482. </class>
  12483. <!-- end class org.apache.hadoop.mapred.lib.db.DBOutputFormat.DBRecordWriter -->
  12484. <!-- start interface org.apache.hadoop.mapred.lib.db.DBWritable -->
  12485. <interface name="DBWritable" abstract="true"
  12486. static="false" final="false" visibility="public"
  12487. deprecated="Use {@link org.apache.hadoop.mapreduce.lib.db.DBWritable} instead">
  12488. <implements name="org.apache.hadoop.mapreduce.lib.db.DBWritable"/>
  12489. <doc>
  12490. <![CDATA[@deprecated
  12491. Use {@link org.apache.hadoop.mapreduce.lib.db.DBWritable} instead]]>
  12492. </doc>
  12493. </interface>
  12494. <!-- end interface org.apache.hadoop.mapred.lib.db.DBWritable -->
  12495. </package>
  12496. <package name="org.apache.hadoop.mapred.pipes">
  12497. <!-- start class org.apache.hadoop.mapred.pipes.Submitter -->
  12498. <class name="Submitter" extends="org.apache.hadoop.conf.Configured"
  12499. abstract="false"
  12500. static="false" final="false" visibility="public"
  12501. deprecated="not deprecated">
  12502. <implements name="org.apache.hadoop.util.Tool"/>
  12503. <constructor name="Submitter"
  12504. static="false" final="false" visibility="public"
  12505. deprecated="not deprecated">
  12506. </constructor>
  12507. <constructor name="Submitter" type="org.apache.hadoop.conf.Configuration"
  12508. static="false" final="false" visibility="public"
  12509. deprecated="not deprecated">
  12510. </constructor>
  12511. <method name="getExecutable" return="java.lang.String"
  12512. abstract="false" native="false" synchronized="false"
  12513. static="true" final="false" visibility="public"
  12514. deprecated="not deprecated">
  12515. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12516. <doc>
  12517. <![CDATA[Get the URI of the application's executable.
  12518. @param conf
  12519. @return the URI where the application's executable is located]]>
  12520. </doc>
  12521. </method>
  12522. <method name="setExecutable"
  12523. abstract="false" native="false" synchronized="false"
  12524. static="true" final="false" visibility="public"
  12525. deprecated="not deprecated">
  12526. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12527. <param name="executable" type="java.lang.String"/>
  12528. <doc>
  12529. <![CDATA[Set the URI for the application's executable. Normally this is a hdfs:
  12530. location.
  12531. @param conf
  12532. @param executable The URI of the application's executable.]]>
  12533. </doc>
  12534. </method>
  12535. <method name="setIsJavaRecordReader"
  12536. abstract="false" native="false" synchronized="false"
  12537. static="true" final="false" visibility="public"
  12538. deprecated="not deprecated">
  12539. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12540. <param name="value" type="boolean"/>
  12541. <doc>
  12542. <![CDATA[Set whether the job is using a Java RecordReader.
  12543. @param conf the configuration to modify
  12544. @param value the new value]]>
  12545. </doc>
  12546. </method>
  12547. <method name="getIsJavaRecordReader" return="boolean"
  12548. abstract="false" native="false" synchronized="false"
  12549. static="true" final="false" visibility="public"
  12550. deprecated="not deprecated">
  12551. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12552. <doc>
  12553. <![CDATA[Check whether the job is using a Java RecordReader
  12554. @param conf the configuration to check
  12555. @return is it a Java RecordReader?]]>
  12556. </doc>
  12557. </method>
  12558. <method name="setIsJavaMapper"
  12559. abstract="false" native="false" synchronized="false"
  12560. static="true" final="false" visibility="public"
  12561. deprecated="not deprecated">
  12562. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12563. <param name="value" type="boolean"/>
  12564. <doc>
  12565. <![CDATA[Set whether the Mapper is written in Java.
  12566. @param conf the configuration to modify
  12567. @param value the new value]]>
  12568. </doc>
  12569. </method>
  12570. <method name="getIsJavaMapper" return="boolean"
  12571. abstract="false" native="false" synchronized="false"
  12572. static="true" final="false" visibility="public"
  12573. deprecated="not deprecated">
  12574. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12575. <doc>
  12576. <![CDATA[Check whether the job is using a Java Mapper.
  12577. @param conf the configuration to check
  12578. @return is it a Java Mapper?]]>
  12579. </doc>
  12580. </method>
  12581. <method name="setIsJavaReducer"
  12582. abstract="false" native="false" synchronized="false"
  12583. static="true" final="false" visibility="public"
  12584. deprecated="not deprecated">
  12585. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12586. <param name="value" type="boolean"/>
  12587. <doc>
  12588. <![CDATA[Set whether the Reducer is written in Java.
  12589. @param conf the configuration to modify
  12590. @param value the new value]]>
  12591. </doc>
  12592. </method>
  12593. <method name="getIsJavaReducer" return="boolean"
  12594. abstract="false" native="false" synchronized="false"
  12595. static="true" final="false" visibility="public"
  12596. deprecated="not deprecated">
  12597. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12598. <doc>
  12599. <![CDATA[Check whether the job is using a Java Reducer.
  12600. @param conf the configuration to check
  12601. @return is it a Java Reducer?]]>
  12602. </doc>
  12603. </method>
  12604. <method name="setIsJavaRecordWriter"
  12605. abstract="false" native="false" synchronized="false"
  12606. static="true" final="false" visibility="public"
  12607. deprecated="not deprecated">
  12608. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12609. <param name="value" type="boolean"/>
  12610. <doc>
  12611. <![CDATA[Set whether the job will use a Java RecordWriter.
  12612. @param conf the configuration to modify
  12613. @param value the new value to set]]>
  12614. </doc>
  12615. </method>
  12616. <method name="getIsJavaRecordWriter" return="boolean"
  12617. abstract="false" native="false" synchronized="false"
  12618. static="true" final="false" visibility="public"
  12619. deprecated="not deprecated">
  12620. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12621. <doc>
  12622. <![CDATA[Will the reduce use a Java RecordWriter?
  12623. @param conf the configuration to check
  12624. @return true, if the output of the job will be written by Java]]>
  12625. </doc>
  12626. </method>
  12627. <method name="getKeepCommandFile" return="boolean"
  12628. abstract="false" native="false" synchronized="false"
  12629. static="true" final="false" visibility="public"
  12630. deprecated="not deprecated">
  12631. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12632. <doc>
  12633. <![CDATA[Does the user want to keep the command file for debugging? If this is
  12634. true, pipes will write a copy of the command data to a file in the
  12635. task directory named "downlink.data", which may be used to run the C++
  12636. program under the debugger. You probably also want to set
  12637. JobConf.setKeepFailedTaskFiles(true) to keep the entire directory from
  12638. being deleted.
  12639. To run using the data file, set the environment variable
  12640. "mapreduce.pipes.commandfile" to point to the file.
  12641. @param conf the configuration to check
  12642. @return will the framework save the command file?]]>
  12643. </doc>
  12644. </method>
  12645. <method name="setKeepCommandFile"
  12646. abstract="false" native="false" synchronized="false"
  12647. static="true" final="false" visibility="public"
  12648. deprecated="not deprecated">
  12649. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12650. <param name="keep" type="boolean"/>
  12651. <doc>
  12652. <![CDATA[Set whether to keep the command file for debugging
  12653. @param conf the configuration to modify
  12654. @param keep the new value]]>
  12655. </doc>
  12656. </method>
  12657. <method name="submitJob" return="org.apache.hadoop.mapred.RunningJob"
  12658. abstract="false" native="false" synchronized="false"
  12659. static="true" final="false" visibility="public"
  12660. deprecated="Use {@link Submitter#runJob(JobConf)}">
  12661. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12662. <exception name="IOException" type="java.io.IOException"/>
  12663. <doc>
  12664. <![CDATA[Submit a job to the map/reduce cluster. All of the necessary modifications
  12665. to the job to run under pipes are made to the configuration.
  12666. @param conf the job to submit to the cluster (MODIFIED)
  12667. @throws IOException
  12668. @deprecated Use {@link Submitter#runJob(JobConf)}]]>
  12669. </doc>
  12670. </method>
  12671. <method name="runJob" return="org.apache.hadoop.mapred.RunningJob"
  12672. abstract="false" native="false" synchronized="false"
  12673. static="true" final="false" visibility="public"
  12674. deprecated="not deprecated">
  12675. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12676. <exception name="IOException" type="java.io.IOException"/>
  12677. <doc>
  12678. <![CDATA[Submit a job to the map/reduce cluster. All of the necessary modifications
  12679. to the job to run under pipes are made to the configuration.
  12680. @param conf the job to submit to the cluster (MODIFIED)
  12681. @throws IOException]]>
  12682. </doc>
  12683. </method>
  12684. <method name="jobSubmit" return="org.apache.hadoop.mapred.RunningJob"
  12685. abstract="false" native="false" synchronized="false"
  12686. static="true" final="false" visibility="public"
  12687. deprecated="not deprecated">
  12688. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  12689. <exception name="IOException" type="java.io.IOException"/>
  12690. <doc>
  12691. <![CDATA[Submit a job to the Map-Reduce framework.
  12692. This returns a handle to the {@link RunningJob} which can be used to track
  12693. the running-job.
  12694. @param conf the job configuration.
  12695. @return a handle to the {@link RunningJob} which can be used to track the
  12696. running-job.
  12697. @throws IOException]]>
  12698. </doc>
  12699. </method>
  12700. <method name="run" return="int"
  12701. abstract="false" native="false" synchronized="false"
  12702. static="false" final="false" visibility="public"
  12703. deprecated="not deprecated">
  12704. <param name="args" type="java.lang.String[]"/>
  12705. <exception name="Exception" type="java.lang.Exception"/>
  12706. </method>
  12707. <method name="main"
  12708. abstract="false" native="false" synchronized="false"
  12709. static="true" final="false" visibility="public"
  12710. deprecated="not deprecated">
  12711. <param name="args" type="java.lang.String[]"/>
  12712. <exception name="Exception" type="java.lang.Exception"/>
  12713. <doc>
  12714. <![CDATA[Submit a pipes job based on the command line arguments.
  12715. @param args]]>
  12716. </doc>
  12717. </method>
  12718. <field name="LOG" type="org.apache.commons.logging.Log"
  12719. transient="false" volatile="false"
  12720. static="true" final="true" visibility="protected"
  12721. deprecated="not deprecated">
  12722. </field>
  12723. <field name="PRESERVE_COMMANDFILE" type="java.lang.String"
  12724. transient="false" volatile="false"
  12725. static="true" final="true" visibility="public"
  12726. deprecated="not deprecated">
  12727. </field>
  12728. <field name="EXECUTABLE" type="java.lang.String"
  12729. transient="false" volatile="false"
  12730. static="true" final="true" visibility="public"
  12731. deprecated="not deprecated">
  12732. </field>
  12733. <field name="INTERPRETOR" type="java.lang.String"
  12734. transient="false" volatile="false"
  12735. static="true" final="true" visibility="public"
  12736. deprecated="not deprecated">
  12737. </field>
  12738. <field name="IS_JAVA_MAP" type="java.lang.String"
  12739. transient="false" volatile="false"
  12740. static="true" final="true" visibility="public"
  12741. deprecated="not deprecated">
  12742. </field>
  12743. <field name="IS_JAVA_RR" type="java.lang.String"
  12744. transient="false" volatile="false"
  12745. static="true" final="true" visibility="public"
  12746. deprecated="not deprecated">
  12747. </field>
  12748. <field name="IS_JAVA_RW" type="java.lang.String"
  12749. transient="false" volatile="false"
  12750. static="true" final="true" visibility="public"
  12751. deprecated="not deprecated">
  12752. </field>
  12753. <field name="IS_JAVA_REDUCE" type="java.lang.String"
  12754. transient="false" volatile="false"
  12755. static="true" final="true" visibility="public"
  12756. deprecated="not deprecated">
  12757. </field>
  12758. <field name="PARTITIONER" type="java.lang.String"
  12759. transient="false" volatile="false"
  12760. static="true" final="true" visibility="public"
  12761. deprecated="not deprecated">
  12762. </field>
  12763. <field name="INPUT_FORMAT" type="java.lang.String"
  12764. transient="false" volatile="false"
  12765. static="true" final="true" visibility="public"
  12766. deprecated="not deprecated">
  12767. </field>
  12768. <field name="PORT" type="java.lang.String"
  12769. transient="false" volatile="false"
  12770. static="true" final="true" visibility="public"
  12771. deprecated="not deprecated">
  12772. </field>
  12773. <doc>
  12774. <![CDATA[The main entry point and job submitter. It may either be used as a command
  12775. line-based or API-based method to launch Pipes jobs.]]>
  12776. </doc>
  12777. </class>
  12778. <!-- end class org.apache.hadoop.mapred.pipes.Submitter -->
  12779. </package>
  12780. <package name="org.apache.hadoop.mapred.tools">
  12781. <!-- start class org.apache.hadoop.mapred.tools.MRAdmin -->
  12782. <class name="MRAdmin" extends="org.apache.hadoop.conf.Configured"
  12783. abstract="false"
  12784. static="false" final="false" visibility="public"
  12785. deprecated="not deprecated">
  12786. <implements name="org.apache.hadoop.util.Tool"/>
  12787. <constructor name="MRAdmin"
  12788. static="false" final="false" visibility="public"
  12789. deprecated="not deprecated">
  12790. </constructor>
  12791. <constructor name="MRAdmin" type="org.apache.hadoop.conf.Configuration"
  12792. static="false" final="false" visibility="public"
  12793. deprecated="not deprecated">
  12794. </constructor>
  12795. <method name="refreshSuperUserGroupsConfiguration" return="int"
  12796. abstract="false" native="false" synchronized="false"
  12797. static="false" final="false" visibility="public"
  12798. deprecated="not deprecated">
  12799. <exception name="IOException" type="java.io.IOException"/>
  12800. <doc>
  12801. <![CDATA[refreshSuperUserGroupsConfiguration {@link JobTracker}.
  12802. @return exitcode 0 on success, non-zero on failure
  12803. @throws IOException]]>
  12804. </doc>
  12805. </method>
  12806. <method name="run" return="int"
  12807. abstract="false" native="false" synchronized="false"
  12808. static="false" final="false" visibility="public"
  12809. deprecated="not deprecated">
  12810. <param name="args" type="java.lang.String[]"/>
  12811. <exception name="Exception" type="java.lang.Exception"/>
  12812. </method>
  12813. <method name="main"
  12814. abstract="false" native="false" synchronized="false"
  12815. static="true" final="false" visibility="public"
  12816. deprecated="not deprecated">
  12817. <param name="args" type="java.lang.String[]"/>
  12818. <exception name="Exception" type="java.lang.Exception"/>
  12819. </method>
  12820. <doc>
  12821. <![CDATA[Administrative access to Hadoop Map-Reduce.
  12822. Currently it only provides the ability to connect to the {@link JobTracker}
  12823. and 1) refresh the service-level authorization policy, 2) refresh queue acl
  12824. properties.]]>
  12825. </doc>
  12826. </class>
  12827. <!-- end class org.apache.hadoop.mapred.tools.MRAdmin -->
  12828. </package>
  12829. <package name="org.apache.hadoop.mapreduce">
  12830. <!-- start class org.apache.hadoop.mapreduce.Cluster -->
  12831. <class name="Cluster" extends="java.lang.Object"
  12832. abstract="false"
  12833. static="false" final="false" visibility="public"
  12834. deprecated="not deprecated">
  12835. <constructor name="Cluster" type="org.apache.hadoop.conf.Configuration"
  12836. static="false" final="false" visibility="public"
  12837. deprecated="not deprecated">
  12838. <exception name="IOException" type="java.io.IOException"/>
  12839. </constructor>
  12840. <constructor name="Cluster" type="java.net.InetSocketAddress, org.apache.hadoop.conf.Configuration"
  12841. static="false" final="false" visibility="public"
  12842. deprecated="not deprecated">
  12843. <exception name="IOException" type="java.io.IOException"/>
  12844. </constructor>
  12845. <method name="close"
  12846. abstract="false" native="false" synchronized="true"
  12847. static="false" final="false" visibility="public"
  12848. deprecated="not deprecated">
  12849. <exception name="IOException" type="java.io.IOException"/>
  12850. <doc>
  12851. <![CDATA[Close the <code>Cluster</code>.]]>
  12852. </doc>
  12853. </method>
  12854. <method name="getFileSystem" return="org.apache.hadoop.fs.FileSystem"
  12855. abstract="false" native="false" synchronized="true"
  12856. static="false" final="false" visibility="public"
  12857. deprecated="not deprecated">
  12858. <exception name="IOException" type="java.io.IOException"/>
  12859. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12860. <doc>
  12861. <![CDATA[Get the file system where job-specific files are stored
  12862. @return object of FileSystem
  12863. @throws IOException
  12864. @throws InterruptedException]]>
  12865. </doc>
  12866. </method>
  12867. <method name="getJob" return="org.apache.hadoop.mapreduce.Job"
  12868. abstract="false" native="false" synchronized="false"
  12869. static="false" final="false" visibility="public"
  12870. deprecated="not deprecated">
  12871. <param name="jobId" type="org.apache.hadoop.mapreduce.JobID"/>
  12872. <exception name="IOException" type="java.io.IOException"/>
  12873. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12874. <doc>
  12875. <![CDATA[Get job corresponding to jobid.
  12876. @param jobId
  12877. @return object of {@link Job}
  12878. @throws IOException
  12879. @throws InterruptedException]]>
  12880. </doc>
  12881. </method>
  12882. <method name="getQueues" return="org.apache.hadoop.mapreduce.QueueInfo[]"
  12883. abstract="false" native="false" synchronized="false"
  12884. static="false" final="false" visibility="public"
  12885. deprecated="not deprecated">
  12886. <exception name="IOException" type="java.io.IOException"/>
  12887. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12888. <doc>
  12889. <![CDATA[Get all the queues in cluster.
  12890. @return array of {@link QueueInfo}
  12891. @throws IOException
  12892. @throws InterruptedException]]>
  12893. </doc>
  12894. </method>
  12895. <method name="getQueue" return="org.apache.hadoop.mapreduce.QueueInfo"
  12896. abstract="false" native="false" synchronized="false"
  12897. static="false" final="false" visibility="public"
  12898. deprecated="not deprecated">
  12899. <param name="name" type="java.lang.String"/>
  12900. <exception name="IOException" type="java.io.IOException"/>
  12901. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12902. <doc>
  12903. <![CDATA[Get queue information for the specified name.
  12904. @param name queuename
  12905. @return object of {@link QueueInfo}
  12906. @throws IOException
  12907. @throws InterruptedException]]>
  12908. </doc>
  12909. </method>
  12910. <method name="getClusterStatus" return="org.apache.hadoop.mapreduce.ClusterMetrics"
  12911. abstract="false" native="false" synchronized="false"
  12912. static="false" final="false" visibility="public"
  12913. deprecated="not deprecated">
  12914. <exception name="IOException" type="java.io.IOException"/>
  12915. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12916. <doc>
  12917. <![CDATA[Get current cluster status.
  12918. @return object of {@link ClusterMetrics}
  12919. @throws IOException
  12920. @throws InterruptedException]]>
  12921. </doc>
  12922. </method>
  12923. <method name="getActiveTaskTrackers" return="org.apache.hadoop.mapreduce.TaskTrackerInfo[]"
  12924. abstract="false" native="false" synchronized="false"
  12925. static="false" final="false" visibility="public"
  12926. deprecated="not deprecated">
  12927. <exception name="IOException" type="java.io.IOException"/>
  12928. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12929. <doc>
  12930. <![CDATA[Get all active trackers in the cluster.
  12931. @return array of {@link TaskTrackerInfo}
  12932. @throws IOException
  12933. @throws InterruptedException]]>
  12934. </doc>
  12935. </method>
  12936. <method name="getBlackListedTaskTrackers" return="org.apache.hadoop.mapreduce.TaskTrackerInfo[]"
  12937. abstract="false" native="false" synchronized="false"
  12938. static="false" final="false" visibility="public"
  12939. deprecated="not deprecated">
  12940. <exception name="IOException" type="java.io.IOException"/>
  12941. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12942. <doc>
  12943. <![CDATA[Get blacklisted trackers.
  12944. @return array of {@link TaskTrackerInfo}
  12945. @throws IOException
  12946. @throws InterruptedException]]>
  12947. </doc>
  12948. </method>
  12949. <method name="getAllJobs" return="org.apache.hadoop.mapreduce.Job[]"
  12950. abstract="false" native="false" synchronized="false"
  12951. static="false" final="false" visibility="public"
  12952. deprecated="not deprecated">
  12953. <exception name="IOException" type="java.io.IOException"/>
  12954. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12955. <doc>
  12956. <![CDATA[Get all the jobs in cluster.
  12957. @return array of {@link Job}
  12958. @throws IOException
  12959. @throws InterruptedException]]>
  12960. </doc>
  12961. </method>
  12962. <method name="getSystemDir" return="org.apache.hadoop.fs.Path"
  12963. abstract="false" native="false" synchronized="false"
  12964. static="false" final="false" visibility="public"
  12965. deprecated="not deprecated">
  12966. <exception name="IOException" type="java.io.IOException"/>
  12967. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12968. <doc>
  12969. <![CDATA[Grab the jobtracker system directory path where
  12970. job-specific files will be placed.
  12971. @return the system directory where job-specific files are to be placed.]]>
  12972. </doc>
  12973. </method>
  12974. <method name="getStagingAreaDir" return="org.apache.hadoop.fs.Path"
  12975. abstract="false" native="false" synchronized="false"
  12976. static="false" final="false" visibility="public"
  12977. deprecated="not deprecated">
  12978. <exception name="IOException" type="java.io.IOException"/>
  12979. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12980. <doc>
  12981. <![CDATA[Grab the jobtracker's view of the staging directory path where
  12982. job-specific files will be placed.
  12983. @return the staging directory where job-specific files are to be placed.]]>
  12984. </doc>
  12985. </method>
  12986. <method name="getJobHistoryUrl" return="java.lang.String"
  12987. abstract="false" native="false" synchronized="false"
  12988. static="false" final="false" visibility="public"
  12989. deprecated="not deprecated">
  12990. <param name="jobId" type="org.apache.hadoop.mapreduce.JobID"/>
  12991. <exception name="IOException" type="java.io.IOException"/>
  12992. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  12993. <doc>
  12994. <![CDATA[Get the job history file path for a given job id. The job history file at
  12995. this path may or may not be existing depending on the job completion state.
  12996. The file is present only for the completed jobs.
  12997. @param jobId the JobID of the job submitted by the current user.
  12998. @return the file path of the job history file
  12999. @throws IOException
  13000. @throws InterruptedException]]>
  13001. </doc>
  13002. </method>
  13003. <method name="getQueueAclsForCurrentUser" return="org.apache.hadoop.mapreduce.QueueAclsInfo[]"
  13004. abstract="false" native="false" synchronized="false"
  13005. static="false" final="false" visibility="public"
  13006. deprecated="not deprecated">
  13007. <exception name="IOException" type="java.io.IOException"/>
  13008. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13009. <doc>
  13010. <![CDATA[Gets the Queue ACLs for current user
  13011. @return array of QueueAclsInfo object for current user.
  13012. @throws IOException]]>
  13013. </doc>
  13014. </method>
  13015. <method name="getRootQueues" return="org.apache.hadoop.mapreduce.QueueInfo[]"
  13016. abstract="false" native="false" synchronized="false"
  13017. static="false" final="false" visibility="public"
  13018. deprecated="not deprecated">
  13019. <exception name="IOException" type="java.io.IOException"/>
  13020. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13021. <doc>
  13022. <![CDATA[Gets the root level queues.
  13023. @return array of JobQueueInfo object.
  13024. @throws IOException]]>
  13025. </doc>
  13026. </method>
  13027. <method name="getChildQueues" return="org.apache.hadoop.mapreduce.QueueInfo[]"
  13028. abstract="false" native="false" synchronized="false"
  13029. static="false" final="false" visibility="public"
  13030. deprecated="not deprecated">
  13031. <param name="queueName" type="java.lang.String"/>
  13032. <exception name="IOException" type="java.io.IOException"/>
  13033. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13034. <doc>
  13035. <![CDATA[Returns immediate children of queueName.
  13036. @param queueName
  13037. @return array of JobQueueInfo which are children of queueName
  13038. @throws IOException]]>
  13039. </doc>
  13040. </method>
  13041. <method name="getJobTrackerState" return="org.apache.hadoop.mapreduce.server.jobtracker.State"
  13042. abstract="false" native="false" synchronized="false"
  13043. static="false" final="false" visibility="public"
  13044. deprecated="Use {@link #getJobTrackerStatus()} instead.">
  13045. <exception name="IOException" type="java.io.IOException"/>
  13046. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13047. <doc>
  13048. <![CDATA[Get JobTracker's state
  13049. @return {@link State} of the JobTracker
  13050. @throws IOException
  13051. @throws InterruptedException
  13052. @deprecated Use {@link #getJobTrackerStatus()} instead.]]>
  13053. </doc>
  13054. </method>
  13055. <method name="getJobTrackerStatus" return="org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus"
  13056. abstract="false" native="false" synchronized="false"
  13057. static="false" final="false" visibility="public"
  13058. deprecated="not deprecated">
  13059. <exception name="IOException" type="java.io.IOException"/>
  13060. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13061. <doc>
  13062. <![CDATA[Get the JobTracker's status.
  13063. @return {@link JobTrackerStatus} of the JobTracker
  13064. @throws IOException
  13065. @throws InterruptedException]]>
  13066. </doc>
  13067. </method>
  13068. <method name="getTaskTrackerExpiryInterval" return="long"
  13069. abstract="false" native="false" synchronized="false"
  13070. static="false" final="false" visibility="public"
  13071. deprecated="not deprecated">
  13072. <exception name="IOException" type="java.io.IOException"/>
  13073. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13074. <doc>
  13075. <![CDATA[Get the tasktracker expiry interval for the cluster
  13076. @return the expiry interval in msec]]>
  13077. </doc>
  13078. </method>
  13079. <method name="getDelegationToken" return="org.apache.hadoop.security.token.Token"
  13080. abstract="false" native="false" synchronized="false"
  13081. static="false" final="false" visibility="public"
  13082. deprecated="not deprecated">
  13083. <param name="renewer" type="org.apache.hadoop.io.Text"/>
  13084. <exception name="IOException" type="java.io.IOException"/>
  13085. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13086. <doc>
  13087. <![CDATA[Get a delegation token for the user from the JobTracker.
  13088. @param renewer the user who can renew the token
  13089. @return the new token
  13090. @throws IOException]]>
  13091. </doc>
  13092. </method>
  13093. <method name="renewDelegationToken" return="long"
  13094. abstract="false" native="false" synchronized="false"
  13095. static="false" final="false" visibility="public"
  13096. deprecated="not deprecated">
  13097. <param name="token" type="org.apache.hadoop.security.token.Token"/>
  13098. <exception name="SecretManager.InvalidToken" type="org.apache.hadoop.security.token.SecretManager.InvalidToken"/>
  13099. <exception name="IOException" type="java.io.IOException"/>
  13100. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13101. <doc>
  13102. <![CDATA[Renew a delegation token
  13103. @param token the token to renew
  13104. @return the new expiration time
  13105. @throws InvalidToken
  13106. @throws IOException]]>
  13107. </doc>
  13108. </method>
  13109. <method name="cancelDelegationToken"
  13110. abstract="false" native="false" synchronized="false"
  13111. static="false" final="false" visibility="public"
  13112. deprecated="not deprecated">
  13113. <param name="token" type="org.apache.hadoop.security.token.Token"/>
  13114. <exception name="IOException" type="java.io.IOException"/>
  13115. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13116. <doc>
  13117. <![CDATA[Cancel a delegation token from the JobTracker
  13118. @param token the token to cancel
  13119. @throws IOException]]>
  13120. </doc>
  13121. </method>
  13122. <doc>
  13123. <![CDATA[Provides a way to access information about the map/reduce cluster.]]>
  13124. </doc>
  13125. </class>
  13126. <!-- end class org.apache.hadoop.mapreduce.Cluster -->
  13127. <!-- start class org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus -->
  13128. <class name="Cluster.JobTrackerStatus" extends="java.lang.Enum"
  13129. abstract="false"
  13130. static="true" final="true" visibility="public"
  13131. deprecated="not deprecated">
  13132. <method name="values" return="org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus[]"
  13133. abstract="false" native="false" synchronized="false"
  13134. static="true" final="false" visibility="public"
  13135. deprecated="not deprecated">
  13136. </method>
  13137. <method name="valueOf" return="org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus"
  13138. abstract="false" native="false" synchronized="false"
  13139. static="true" final="false" visibility="public"
  13140. deprecated="not deprecated">
  13141. <param name="name" type="java.lang.String"/>
  13142. </method>
  13143. </class>
  13144. <!-- end class org.apache.hadoop.mapreduce.Cluster.JobTrackerStatus -->
  13145. <!-- start class org.apache.hadoop.mapreduce.ClusterMetrics -->
  13146. <class name="ClusterMetrics" extends="java.lang.Object"
  13147. abstract="false"
  13148. static="false" final="false" visibility="public"
  13149. deprecated="not deprecated">
  13150. <implements name="org.apache.hadoop.io.Writable"/>
  13151. <constructor name="ClusterMetrics"
  13152. static="false" final="false" visibility="public"
  13153. deprecated="not deprecated">
  13154. </constructor>
  13155. <constructor name="ClusterMetrics" type="int, int, int, int, int, int, int, int, int, int, int, int"
  13156. static="false" final="false" visibility="public"
  13157. deprecated="not deprecated">
  13158. </constructor>
  13159. <method name="getRunningMaps" return="int"
  13160. abstract="false" native="false" synchronized="false"
  13161. static="false" final="false" visibility="public"
  13162. deprecated="not deprecated">
  13163. <doc>
  13164. <![CDATA[Get the number of running map tasks in the cluster.
  13165. @return running maps]]>
  13166. </doc>
  13167. </method>
  13168. <method name="getRunningReduces" return="int"
  13169. abstract="false" native="false" synchronized="false"
  13170. static="false" final="false" visibility="public"
  13171. deprecated="not deprecated">
  13172. <doc>
  13173. <![CDATA[Get the number of running reduce tasks in the cluster.
  13174. @return running reduces]]>
  13175. </doc>
  13176. </method>
  13177. <method name="getOccupiedMapSlots" return="int"
  13178. abstract="false" native="false" synchronized="false"
  13179. static="false" final="false" visibility="public"
  13180. deprecated="not deprecated">
  13181. <doc>
  13182. <![CDATA[Get number of occupied map slots in the cluster.
  13183. @return occupied map slot count]]>
  13184. </doc>
  13185. </method>
  13186. <method name="getOccupiedReduceSlots" return="int"
  13187. abstract="false" native="false" synchronized="false"
  13188. static="false" final="false" visibility="public"
  13189. deprecated="not deprecated">
  13190. <doc>
  13191. <![CDATA[Get the number of occupied reduce slots in the cluster.
  13192. @return occupied reduce slot count]]>
  13193. </doc>
  13194. </method>
  13195. <method name="getReservedMapSlots" return="int"
  13196. abstract="false" native="false" synchronized="false"
  13197. static="false" final="false" visibility="public"
  13198. deprecated="not deprecated">
  13199. <doc>
  13200. <![CDATA[Get number of reserved map slots in the cluster.
  13201. @return reserved map slot count]]>
  13202. </doc>
  13203. </method>
  13204. <method name="getReservedReduceSlots" return="int"
  13205. abstract="false" native="false" synchronized="false"
  13206. static="false" final="false" visibility="public"
  13207. deprecated="not deprecated">
  13208. <doc>
  13209. <![CDATA[Get the number of reserved reduce slots in the cluster.
  13210. @return reserved reduce slot count]]>
  13211. </doc>
  13212. </method>
  13213. <method name="getMapSlotCapacity" return="int"
  13214. abstract="false" native="false" synchronized="false"
  13215. static="false" final="false" visibility="public"
  13216. deprecated="not deprecated">
  13217. <doc>
  13218. <![CDATA[Get the total number of map slots in the cluster.
  13219. @return map slot capacity]]>
  13220. </doc>
  13221. </method>
  13222. <method name="getReduceSlotCapacity" return="int"
  13223. abstract="false" native="false" synchronized="false"
  13224. static="false" final="false" visibility="public"
  13225. deprecated="not deprecated">
  13226. <doc>
  13227. <![CDATA[Get the total number of reduce slots in the cluster.
  13228. @return reduce slot capacity]]>
  13229. </doc>
  13230. </method>
  13231. <method name="getTotalJobSubmissions" return="int"
  13232. abstract="false" native="false" synchronized="false"
  13233. static="false" final="false" visibility="public"
  13234. deprecated="not deprecated">
  13235. <doc>
  13236. <![CDATA[Get the total number of job submissions in the cluster.
  13237. @return total number of job submissions]]>
  13238. </doc>
  13239. </method>
  13240. <method name="getTaskTrackerCount" return="int"
  13241. abstract="false" native="false" synchronized="false"
  13242. static="false" final="false" visibility="public"
  13243. deprecated="not deprecated">
  13244. <doc>
  13245. <![CDATA[Get the number of active trackers in the cluster.
  13246. @return active tracker count.]]>
  13247. </doc>
  13248. </method>
  13249. <method name="getBlackListedTaskTrackerCount" return="int"
  13250. abstract="false" native="false" synchronized="false"
  13251. static="false" final="false" visibility="public"
  13252. deprecated="not deprecated">
  13253. <doc>
  13254. <![CDATA[Get the number of blacklisted trackers in the cluster.
  13255. @return blacklisted tracker count]]>
  13256. </doc>
  13257. </method>
  13258. <method name="getDecommissionedTaskTrackerCount" return="int"
  13259. abstract="false" native="false" synchronized="false"
  13260. static="false" final="false" visibility="public"
  13261. deprecated="not deprecated">
  13262. <doc>
  13263. <![CDATA[Get the number of decommissioned trackers in the cluster.
  13264. @return decommissioned tracker count]]>
  13265. </doc>
  13266. </method>
  13267. <method name="readFields"
  13268. abstract="false" native="false" synchronized="false"
  13269. static="false" final="false" visibility="public"
  13270. deprecated="not deprecated">
  13271. <param name="in" type="java.io.DataInput"/>
  13272. <exception name="IOException" type="java.io.IOException"/>
  13273. </method>
  13274. <method name="write"
  13275. abstract="false" native="false" synchronized="false"
  13276. static="false" final="false" visibility="public"
  13277. deprecated="not deprecated">
  13278. <param name="out" type="java.io.DataOutput"/>
  13279. <exception name="IOException" type="java.io.IOException"/>
  13280. </method>
  13281. <doc>
  13282. <![CDATA[Status information on the current state of the Map-Reduce cluster.
  13283. <p><code>ClusterMetrics</code> provides clients with information such as:
  13284. <ol>
  13285. <li>
  13286. Size of the cluster.
  13287. </li>
  13288. <li>
  13289. Number of blacklisted and decommissioned trackers.
  13290. </li>
  13291. <li>
  13292. Slot capacity of the cluster.
  13293. </li>
  13294. <li>
  13295. The number of currently occupied/reserved map & reduce slots.
  13296. </li>
  13297. <li>
  13298. The number of currently running map & reduce tasks.
  13299. </li>
  13300. <li>
  13301. The number of job submissions.
  13302. </li>
  13303. </ol></p>
  13304. <p>Clients can query for the latest <code>ClusterMetrics</code>, via
  13305. {@link Cluster#getClusterStatus()}.</p>
  13306. @see Cluster]]>
  13307. </doc>
  13308. </class>
  13309. <!-- end class org.apache.hadoop.mapreduce.ClusterMetrics -->
  13310. <!-- start class org.apache.hadoop.mapreduce.ContextFactory -->
  13311. <class name="ContextFactory" extends="java.lang.Object"
  13312. abstract="false"
  13313. static="false" final="false" visibility="public"
  13314. deprecated="not deprecated">
  13315. <constructor name="ContextFactory"
  13316. static="false" final="false" visibility="public"
  13317. deprecated="not deprecated">
  13318. </constructor>
  13319. <method name="cloneContext" return="org.apache.hadoop.mapreduce.JobContext"
  13320. abstract="false" native="false" synchronized="false"
  13321. static="true" final="false" visibility="public"
  13322. deprecated="not deprecated">
  13323. <param name="original" type="org.apache.hadoop.mapreduce.JobContext"/>
  13324. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  13325. <exception name="IOException" type="java.io.IOException"/>
  13326. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13327. <doc>
  13328. <![CDATA[Clone a job or task attempt context with a new configuration.
  13329. @param original the original context
  13330. @param conf the new configuration
  13331. @return a new context object
  13332. @throws InterruptedException
  13333. @throws IOException]]>
  13334. </doc>
  13335. </method>
  13336. <method name="cloneMapContext" return="org.apache.hadoop.mapreduce.Mapper.Context"
  13337. abstract="false" native="false" synchronized="false"
  13338. static="true" final="false" visibility="public"
  13339. deprecated="not deprecated">
  13340. <param name="context" type="org.apache.hadoop.mapreduce.MapContext"/>
  13341. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  13342. <param name="reader" type="org.apache.hadoop.mapreduce.RecordReader"/>
  13343. <param name="writer" type="org.apache.hadoop.mapreduce.RecordWriter"/>
  13344. <exception name="IOException" type="java.io.IOException"/>
  13345. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13346. <doc>
  13347. <![CDATA[Copy a mapper context, optionally replacing the input and output.
  13348. @param <K1> input key type
  13349. @param <V1> input value type
  13350. @param <K2> output key type
  13351. @param <V2> output value type
  13352. @param context the context to clone
  13353. @param conf a new configuration
  13354. @param reader Reader to read from. Null means to clone from context.
  13355. @param writer Writer to write to. Null means to clone from context.
  13356. @return a new context. It will not be the same class as the original.
  13357. @throws IOException
  13358. @throws InterruptedException]]>
  13359. </doc>
  13360. </method>
  13361. <doc>
  13362. <![CDATA[A factory to allow applications to deal with inconsistencies in the
  13363. MapReduce Context Objects API between hadoop-0.20 and later versions.]]>
  13364. </doc>
  13365. </class>
  13366. <!-- end class org.apache.hadoop.mapreduce.ContextFactory -->
  13367. <!-- start class org.apache.hadoop.mapreduce.Counter -->
  13368. <class name="Counter" extends="java.lang.Object"
  13369. abstract="false"
  13370. static="false" final="false" visibility="public"
  13371. deprecated="not deprecated">
  13372. <implements name="org.apache.hadoop.io.Writable"/>
  13373. <constructor name="Counter"
  13374. static="false" final="false" visibility="protected"
  13375. deprecated="not deprecated">
  13376. </constructor>
  13377. <constructor name="Counter" type="java.lang.String, java.lang.String"
  13378. static="false" final="false" visibility="protected"
  13379. deprecated="not deprecated">
  13380. </constructor>
  13381. <constructor name="Counter" type="java.lang.String, java.lang.String, long"
  13382. static="false" final="false" visibility="public"
  13383. deprecated="not deprecated">
  13384. <doc>
  13385. <![CDATA[Create a counter.
  13386. @param name the name within the group's enum.
  13387. @param displayName a name to be displayed.
  13388. @param value the counter value.]]>
  13389. </doc>
  13390. </constructor>
  13391. <method name="setDisplayName"
  13392. abstract="false" native="false" synchronized="true"
  13393. static="false" final="false" visibility="protected"
  13394. deprecated="not deprecated">
  13395. <param name="displayName" type="java.lang.String"/>
  13396. </method>
  13397. <method name="readFields"
  13398. abstract="false" native="false" synchronized="true"
  13399. static="false" final="false" visibility="public"
  13400. deprecated="not deprecated">
  13401. <param name="in" type="java.io.DataInput"/>
  13402. <exception name="IOException" type="java.io.IOException"/>
  13403. <doc>
  13404. <![CDATA[Read the binary representation of the counter]]>
  13405. </doc>
  13406. </method>
  13407. <method name="write"
  13408. abstract="false" native="false" synchronized="true"
  13409. static="false" final="false" visibility="public"
  13410. deprecated="not deprecated">
  13411. <param name="out" type="java.io.DataOutput"/>
  13412. <exception name="IOException" type="java.io.IOException"/>
  13413. <doc>
  13414. <![CDATA[Write the binary representation of the counter]]>
  13415. </doc>
  13416. </method>
  13417. <method name="getName" return="java.lang.String"
  13418. abstract="false" native="false" synchronized="true"
  13419. static="false" final="false" visibility="public"
  13420. deprecated="not deprecated">
  13421. </method>
  13422. <method name="getDisplayName" return="java.lang.String"
  13423. abstract="false" native="false" synchronized="true"
  13424. static="false" final="false" visibility="public"
  13425. deprecated="not deprecated">
  13426. <doc>
  13427. <![CDATA[Get the display name of the counter.
  13428. @return the user facing name of the counter]]>
  13429. </doc>
  13430. </method>
  13431. <method name="getValue" return="long"
  13432. abstract="false" native="false" synchronized="true"
  13433. static="false" final="false" visibility="public"
  13434. deprecated="not deprecated">
  13435. <doc>
  13436. <![CDATA[What is the current value of this counter?
  13437. @return the current value]]>
  13438. </doc>
  13439. </method>
  13440. <method name="setValue"
  13441. abstract="false" native="false" synchronized="true"
  13442. static="false" final="false" visibility="public"
  13443. deprecated="not deprecated">
  13444. <param name="value" type="long"/>
  13445. <doc>
  13446. <![CDATA[Set this counter to the given value
  13447. @param value the value to set]]>
  13448. </doc>
  13449. </method>
  13450. <method name="increment"
  13451. abstract="false" native="false" synchronized="true"
  13452. static="false" final="false" visibility="public"
  13453. deprecated="not deprecated">
  13454. <param name="incr" type="long"/>
  13455. <doc>
  13456. <![CDATA[Increment this counter by the given value
  13457. @param incr the value to increase this counter by]]>
  13458. </doc>
  13459. </method>
  13460. <method name="equals" return="boolean"
  13461. abstract="false" native="false" synchronized="true"
  13462. static="false" final="false" visibility="public"
  13463. deprecated="not deprecated">
  13464. <param name="genericRight" type="java.lang.Object"/>
  13465. </method>
  13466. <method name="hashCode" return="int"
  13467. abstract="false" native="false" synchronized="true"
  13468. static="false" final="false" visibility="public"
  13469. deprecated="not deprecated">
  13470. </method>
  13471. <doc>
  13472. <![CDATA[A named counter that tracks the progress of a map/reduce job.
  13473. <p><code>Counters</code> represent global counters, defined either by the
  13474. Map-Reduce framework or applications. Each <code>Counter</code> is named by
  13475. an {@link Enum} and has a long for the value.</p>
  13476. <p><code>Counters</code> are bunched into Groups, each comprising
  13477. counters from a particular <code>Enum</code> class.</p>]]>
  13478. </doc>
  13479. </class>
  13480. <!-- end class org.apache.hadoop.mapreduce.Counter -->
  13481. <!-- start class org.apache.hadoop.mapreduce.CounterGroup -->
  13482. <class name="CounterGroup" extends="java.lang.Object"
  13483. abstract="false"
  13484. static="false" final="false" visibility="public"
  13485. deprecated="not deprecated">
  13486. <implements name="org.apache.hadoop.io.Writable"/>
  13487. <implements name="java.lang.Iterable"/>
  13488. <constructor name="CounterGroup" type="java.lang.String"
  13489. static="false" final="false" visibility="protected"
  13490. deprecated="not deprecated">
  13491. </constructor>
  13492. <constructor name="CounterGroup" type="java.lang.String, java.lang.String"
  13493. static="false" final="false" visibility="public"
  13494. deprecated="not deprecated">
  13495. <doc>
  13496. <![CDATA[Create a CounterGroup.
  13497. @param name the name of the group's enum.
  13498. @param displayName a name to be displayed for the group.]]>
  13499. </doc>
  13500. </constructor>
  13501. <method name="getName" return="java.lang.String"
  13502. abstract="false" native="false" synchronized="true"
  13503. static="false" final="false" visibility="public"
  13504. deprecated="not deprecated">
  13505. <doc>
  13506. <![CDATA[Get the internal name of the group
  13507. @return the internal name]]>
  13508. </doc>
  13509. </method>
  13510. <method name="getDisplayName" return="java.lang.String"
  13511. abstract="false" native="false" synchronized="true"
  13512. static="false" final="false" visibility="public"
  13513. deprecated="not deprecated">
  13514. <doc>
  13515. <![CDATA[Get the display name of the group.
  13516. @return the human readable name]]>
  13517. </doc>
  13518. </method>
  13519. <method name="addCounter"
  13520. abstract="false" native="false" synchronized="true"
  13521. static="false" final="false" visibility="public"
  13522. deprecated="not deprecated">
  13523. <param name="counter" type="org.apache.hadoop.mapreduce.Counter"/>
  13524. <doc>
  13525. <![CDATA[Add a counter to this group.]]>
  13526. </doc>
  13527. </method>
  13528. <method name="findCounter" return="org.apache.hadoop.mapreduce.Counter"
  13529. abstract="false" native="false" synchronized="false"
  13530. static="false" final="false" visibility="public"
  13531. deprecated="not deprecated">
  13532. <param name="counterName" type="java.lang.String"/>
  13533. <param name="displayName" type="java.lang.String"/>
  13534. <doc>
  13535. <![CDATA[Find a counter in a group.
  13536. @param counterName the name of the counter
  13537. @param displayName the display name of the counter
  13538. @return the counter that was found or added]]>
  13539. </doc>
  13540. </method>
  13541. <method name="findCounter" return="org.apache.hadoop.mapreduce.Counter"
  13542. abstract="false" native="false" synchronized="true"
  13543. static="false" final="false" visibility="public"
  13544. deprecated="not deprecated">
  13545. <param name="counterName" type="java.lang.String"/>
  13546. </method>
  13547. <method name="iterator" return="java.util.Iterator"
  13548. abstract="false" native="false" synchronized="true"
  13549. static="false" final="false" visibility="public"
  13550. deprecated="not deprecated">
  13551. </method>
  13552. <method name="write"
  13553. abstract="false" native="false" synchronized="true"
  13554. static="false" final="false" visibility="public"
  13555. deprecated="not deprecated">
  13556. <param name="out" type="java.io.DataOutput"/>
  13557. <exception name="IOException" type="java.io.IOException"/>
  13558. </method>
  13559. <method name="readFields"
  13560. abstract="false" native="false" synchronized="true"
  13561. static="false" final="false" visibility="public"
  13562. deprecated="not deprecated">
  13563. <param name="in" type="java.io.DataInput"/>
  13564. <exception name="IOException" type="java.io.IOException"/>
  13565. </method>
  13566. <method name="size" return="int"
  13567. abstract="false" native="false" synchronized="true"
  13568. static="false" final="false" visibility="public"
  13569. deprecated="not deprecated">
  13570. <doc>
  13571. <![CDATA[Returns the number of counters in this group.]]>
  13572. </doc>
  13573. </method>
  13574. <method name="equals" return="boolean"
  13575. abstract="false" native="false" synchronized="true"
  13576. static="false" final="false" visibility="public"
  13577. deprecated="not deprecated">
  13578. <param name="genericRight" type="java.lang.Object"/>
  13579. </method>
  13580. <method name="hashCode" return="int"
  13581. abstract="false" native="false" synchronized="true"
  13582. static="false" final="false" visibility="public"
  13583. deprecated="not deprecated">
  13584. </method>
  13585. <method name="incrAllCounters"
  13586. abstract="false" native="false" synchronized="true"
  13587. static="false" final="false" visibility="public"
  13588. deprecated="not deprecated">
  13589. <param name="rightGroup" type="org.apache.hadoop.mapreduce.CounterGroup"/>
  13590. </method>
  13591. <doc>
  13592. <![CDATA[A group of {@link Counter}s that logically belong together. Typically,
  13593. it is an {@link Enum} subclass and the counters are the values.]]>
  13594. </doc>
  13595. </class>
  13596. <!-- end class org.apache.hadoop.mapreduce.CounterGroup -->
  13597. <!-- start class org.apache.hadoop.mapreduce.Counters -->
  13598. <class name="Counters" extends="java.lang.Object"
  13599. abstract="false"
  13600. static="false" final="false" visibility="public"
  13601. deprecated="not deprecated">
  13602. <implements name="org.apache.hadoop.io.Writable"/>
  13603. <implements name="java.lang.Iterable"/>
  13604. <constructor name="Counters"
  13605. static="false" final="false" visibility="public"
  13606. deprecated="not deprecated">
  13607. </constructor>
  13608. <constructor name="Counters" type="org.apache.hadoop.mapred.Counters"
  13609. static="false" final="false" visibility="public"
  13610. deprecated="not deprecated">
  13611. <doc>
  13612. <![CDATA[Utility method to create a Counters object from the
  13613. org.apache.hadoop.mapred counters
  13614. @param counters]]>
  13615. </doc>
  13616. </constructor>
  13617. <method name="addGroup"
  13618. abstract="false" native="false" synchronized="false"
  13619. static="false" final="false" visibility="public"
  13620. deprecated="not deprecated">
  13621. <param name="group" type="org.apache.hadoop.mapreduce.CounterGroup"/>
  13622. <doc>
  13623. <![CDATA[Add a group.]]>
  13624. </doc>
  13625. </method>
  13626. <method name="findCounter" return="org.apache.hadoop.mapreduce.Counter"
  13627. abstract="false" native="false" synchronized="false"
  13628. static="false" final="false" visibility="public"
  13629. deprecated="not deprecated">
  13630. <param name="groupName" type="java.lang.String"/>
  13631. <param name="counterName" type="java.lang.String"/>
  13632. </method>
  13633. <method name="findCounter" return="org.apache.hadoop.mapreduce.Counter"
  13634. abstract="false" native="false" synchronized="true"
  13635. static="false" final="false" visibility="public"
  13636. deprecated="not deprecated">
  13637. <param name="key" type="java.lang.Enum"/>
  13638. <doc>
  13639. <![CDATA[Find the counter for the given enum. The same enum will always return the
  13640. same counter.
  13641. @param key the counter key
  13642. @return the matching counter object]]>
  13643. </doc>
  13644. </method>
  13645. <method name="getGroupNames" return="java.util.Collection"
  13646. abstract="false" native="false" synchronized="true"
  13647. static="false" final="false" visibility="public"
  13648. deprecated="not deprecated">
  13649. <doc>
  13650. <![CDATA[Returns the names of all counter classes.
  13651. @return the collection of counter group names.]]>
  13652. </doc>
  13653. </method>
  13654. <method name="iterator" return="java.util.Iterator"
  13655. abstract="false" native="false" synchronized="false"
  13656. static="false" final="false" visibility="public"
  13657. deprecated="not deprecated">
  13658. </method>
  13659. <method name="getGroup" return="org.apache.hadoop.mapreduce.CounterGroup"
  13660. abstract="false" native="false" synchronized="true"
  13661. static="false" final="false" visibility="public"
  13662. deprecated="not deprecated">
  13663. <param name="groupName" type="java.lang.String"/>
  13664. <doc>
  13665. <![CDATA[Returns the named counter group, or an empty group if there is none
  13666. with the specified name.]]>
  13667. </doc>
  13668. </method>
  13669. <method name="countCounters" return="int"
  13670. abstract="false" native="false" synchronized="true"
  13671. static="false" final="false" visibility="public"
  13672. deprecated="not deprecated">
  13673. <doc>
  13674. <![CDATA[Returns the total number of counters, by summing the number of counters
  13675. in each group.]]>
  13676. </doc>
  13677. </method>
  13678. <method name="write"
  13679. abstract="false" native="false" synchronized="true"
  13680. static="false" final="false" visibility="public"
  13681. deprecated="not deprecated">
  13682. <param name="out" type="java.io.DataOutput"/>
  13683. <exception name="IOException" type="java.io.IOException"/>
  13684. <doc>
  13685. <![CDATA[Write the set of groups.
  13686. The external format is:
  13687. #groups (groupName group)*
  13688. i.e. the number of groups followed by 0 or more groups, where each
  13689. group is of the form:
  13690. groupDisplayName #counters (false | true counter)*
  13691. where each counter is of the form:
  13692. name (false | true displayName) value]]>
  13693. </doc>
  13694. </method>
  13695. <method name="readFields"
  13696. abstract="false" native="false" synchronized="true"
  13697. static="false" final="false" visibility="public"
  13698. deprecated="not deprecated">
  13699. <param name="in" type="java.io.DataInput"/>
  13700. <exception name="IOException" type="java.io.IOException"/>
  13701. <doc>
  13702. <![CDATA[Read a set of groups.]]>
  13703. </doc>
  13704. </method>
  13705. <method name="toString" return="java.lang.String"
  13706. abstract="false" native="false" synchronized="true"
  13707. static="false" final="false" visibility="public"
  13708. deprecated="not deprecated">
  13709. <doc>
  13710. <![CDATA[Return textual representation of the counter values.]]>
  13711. </doc>
  13712. </method>
  13713. <method name="incrAllCounters"
  13714. abstract="false" native="false" synchronized="true"
  13715. static="false" final="false" visibility="public"
  13716. deprecated="not deprecated">
  13717. <param name="other" type="org.apache.hadoop.mapreduce.Counters"/>
  13718. <doc>
  13719. <![CDATA[Increments multiple counters by their amounts in another Counters
  13720. instance.
  13721. @param other the other Counters instance]]>
  13722. </doc>
  13723. </method>
  13724. <method name="equals" return="boolean"
  13725. abstract="false" native="false" synchronized="false"
  13726. static="false" final="false" visibility="public"
  13727. deprecated="not deprecated">
  13728. <param name="genericRight" type="java.lang.Object"/>
  13729. </method>
  13730. <method name="hashCode" return="int"
  13731. abstract="false" native="false" synchronized="false"
  13732. static="false" final="false" visibility="public"
  13733. deprecated="not deprecated">
  13734. </method>
  13735. </class>
  13736. <!-- end class org.apache.hadoop.mapreduce.Counters -->
  13737. <!-- start class org.apache.hadoop.mapreduce.ID -->
  13738. <class name="ID" extends="java.lang.Object"
  13739. abstract="true"
  13740. static="false" final="false" visibility="public"
  13741. deprecated="not deprecated">
  13742. <implements name="org.apache.hadoop.io.WritableComparable"/>
  13743. <constructor name="ID" type="int"
  13744. static="false" final="false" visibility="public"
  13745. deprecated="not deprecated">
  13746. <doc>
  13747. <![CDATA[constructs an ID object from the given int]]>
  13748. </doc>
  13749. </constructor>
  13750. <constructor name="ID"
  13751. static="false" final="false" visibility="protected"
  13752. deprecated="not deprecated">
  13753. </constructor>
  13754. <method name="getId" return="int"
  13755. abstract="false" native="false" synchronized="false"
  13756. static="false" final="false" visibility="public"
  13757. deprecated="not deprecated">
  13758. <doc>
  13759. <![CDATA[returns the int which represents the identifier]]>
  13760. </doc>
  13761. </method>
  13762. <method name="toString" return="java.lang.String"
  13763. abstract="false" native="false" synchronized="false"
  13764. static="false" final="false" visibility="public"
  13765. deprecated="not deprecated">
  13766. </method>
  13767. <method name="hashCode" return="int"
  13768. abstract="false" native="false" synchronized="false"
  13769. static="false" final="false" visibility="public"
  13770. deprecated="not deprecated">
  13771. </method>
  13772. <method name="equals" return="boolean"
  13773. abstract="false" native="false" synchronized="false"
  13774. static="false" final="false" visibility="public"
  13775. deprecated="not deprecated">
  13776. <param name="o" type="java.lang.Object"/>
  13777. </method>
  13778. <method name="compareTo" return="int"
  13779. abstract="false" native="false" synchronized="false"
  13780. static="false" final="false" visibility="public"
  13781. deprecated="not deprecated">
  13782. <param name="that" type="org.apache.hadoop.mapreduce.ID"/>
  13783. <doc>
  13784. <![CDATA[Compare IDs by associated numbers]]>
  13785. </doc>
  13786. </method>
  13787. <method name="readFields"
  13788. abstract="false" native="false" synchronized="false"
  13789. static="false" final="false" visibility="public"
  13790. deprecated="not deprecated">
  13791. <param name="in" type="java.io.DataInput"/>
  13792. <exception name="IOException" type="java.io.IOException"/>
  13793. </method>
  13794. <method name="write"
  13795. abstract="false" native="false" synchronized="false"
  13796. static="false" final="false" visibility="public"
  13797. deprecated="not deprecated">
  13798. <param name="out" type="java.io.DataOutput"/>
  13799. <exception name="IOException" type="java.io.IOException"/>
  13800. </method>
  13801. <field name="SEPARATOR" type="char"
  13802. transient="false" volatile="false"
  13803. static="true" final="true" visibility="protected"
  13804. deprecated="not deprecated">
  13805. </field>
  13806. <field name="id" type="int"
  13807. transient="false" volatile="false"
  13808. static="false" final="false" visibility="protected"
  13809. deprecated="not deprecated">
  13810. </field>
  13811. <doc>
  13812. <![CDATA[A general identifier, which internally stores the id
  13813. as an integer. This is the super class of {@link JobID},
  13814. {@link TaskID} and {@link TaskAttemptID}.
  13815. @see JobID
  13816. @see TaskID
  13817. @see TaskAttemptID]]>
  13818. </doc>
  13819. </class>
  13820. <!-- end class org.apache.hadoop.mapreduce.ID -->
  13821. <!-- start class org.apache.hadoop.mapreduce.InputFormat -->
  13822. <class name="InputFormat" extends="java.lang.Object"
  13823. abstract="true"
  13824. static="false" final="false" visibility="public"
  13825. deprecated="not deprecated">
  13826. <constructor name="InputFormat"
  13827. static="false" final="false" visibility="public"
  13828. deprecated="not deprecated">
  13829. </constructor>
  13830. <method name="getSplits" return="java.util.List"
  13831. abstract="true" native="false" synchronized="false"
  13832. static="false" final="false" visibility="public"
  13833. deprecated="not deprecated">
  13834. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  13835. <exception name="IOException" type="java.io.IOException"/>
  13836. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13837. <doc>
  13838. <![CDATA[Logically split the set of input files for the job.
  13839. <p>Each {@link InputSplit} is then assigned to an individual {@link Mapper}
  13840. for processing.</p>
  13841. <p><i>Note</i>: The split is a <i>logical</i> split of the inputs and the
  13842. input files are not physically split into chunks. For example, a split could
  13843. be an <i>&lt;input-file-path, start, offset&gt;</i> tuple. The InputFormat
  13844. also creates the {@link RecordReader} to read the {@link InputSplit}.</p>
  13845. @param context job configuration.
  13846. @return a list of {@link InputSplit}s for the job.]]>
  13847. </doc>
  13848. </method>
  13849. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  13850. abstract="true" native="false" synchronized="false"
  13851. static="false" final="false" visibility="public"
  13852. deprecated="not deprecated">
  13853. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  13854. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  13855. <exception name="IOException" type="java.io.IOException"/>
  13856. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13857. <doc>
  13858. <![CDATA[Create a record reader for a given split. The framework will call
  13859. {@link RecordReader#initialize(InputSplit, TaskAttemptContext)} before
  13860. the split is used.
  13861. @param split the split to be read
  13862. @param context the information about the task
  13863. @return a new record reader
  13864. @throws IOException
  13865. @throws InterruptedException]]>
  13866. </doc>
  13867. </method>
  13868. <doc>
  13869. <![CDATA[<code>InputFormat</code> describes the input-specification for a
  13870. Map-Reduce job.
  13871. <p>The Map-Reduce framework relies on the <code>InputFormat</code> of the
  13872. job to:</p>
  13873. <ol>
  13874. <li>
  13875. Validate the input-specification of the job.</li>
  13876. <li>
  13877. Split-up the input file(s) into logical {@link InputSplit}s, each of
  13878. which is then assigned to an individual {@link Mapper}.
  13879. </li>
  13880. <li>
  13881. Provide the {@link RecordReader} implementation to be used to glean
  13882. input records from the logical <code>InputSplit</code> for processing by
  13883. the {@link Mapper}.
  13884. </li>
  13885. </ol>
  13886. <p>The default behavior of file-based {@link InputFormat}s, typically
  13887. sub-classes of {@link FileInputFormat}, is to split the
  13888. input into <i>logical</i> {@link InputSplit}s based on the total size, in
  13889. bytes, of the input files. However, the {@link FileSystem} blocksize of
  13890. the input files is treated as an upper bound for input splits. A lower bound
  13891. on the split size can be set via
  13892. <a href="{@docRoot}/../mapred-default.html#mapreduce.input.fileinputformat.split.minsize">
  13893. mapreduce.input.fileinputformat.split.minsize</a>.</p>
  13894. <p>Clearly, logical splits based on input-size are insufficient for many
  13895. applications since record boundaries are to be respected. In such cases, the
  13896. application has to also implement a {@link RecordReader} on whom lies the
  13897. responsibility to respect record-boundaries and present a record-oriented
  13898. view of the logical <code>InputSplit</code> to the individual task.</p>
  13899. @see InputSplit
  13900. @see RecordReader
  13901. @see FileInputFormat]]>
  13902. </doc>
  13903. </class>
  13904. <!-- end class org.apache.hadoop.mapreduce.InputFormat -->
  13905. <!-- start class org.apache.hadoop.mapreduce.InputSplit -->
  13906. <class name="InputSplit" extends="java.lang.Object"
  13907. abstract="true"
  13908. static="false" final="false" visibility="public"
  13909. deprecated="not deprecated">
  13910. <constructor name="InputSplit"
  13911. static="false" final="false" visibility="public"
  13912. deprecated="not deprecated">
  13913. </constructor>
  13914. <method name="getLength" return="long"
  13915. abstract="true" native="false" synchronized="false"
  13916. static="false" final="false" visibility="public"
  13917. deprecated="not deprecated">
  13918. <exception name="IOException" type="java.io.IOException"/>
  13919. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13920. <doc>
  13921. <![CDATA[Get the size of the split, so that the input splits can be sorted by size.
  13922. @return the number of bytes in the split
  13923. @throws IOException
  13924. @throws InterruptedException]]>
  13925. </doc>
  13926. </method>
  13927. <method name="getLocations" return="java.lang.String[]"
  13928. abstract="true" native="false" synchronized="false"
  13929. static="false" final="false" visibility="public"
  13930. deprecated="not deprecated">
  13931. <exception name="IOException" type="java.io.IOException"/>
  13932. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  13933. <doc>
  13934. <![CDATA[Get the list of nodes by name where the data for the split would be local.
  13935. The locations do not need to be serialized.
  13936. @return a new array of the node names.
  13937. @throws IOException
  13938. @throws InterruptedException]]>
  13939. </doc>
  13940. </method>
  13941. <doc>
  13942. <![CDATA[<code>InputSplit</code> represents the data to be processed by an
  13943. individual {@link Mapper}.
  13944. <p>Typically, it presents a byte-oriented view on the input, and it is the
  13945. responsibility of the {@link RecordReader} of the job to process this and present
  13946. a record-oriented view.
  13947. @see InputFormat
  13948. @see RecordReader]]>
  13949. </doc>
  13950. </class>
  13951. <!-- end class org.apache.hadoop.mapreduce.InputSplit -->
  13952. <!-- start class org.apache.hadoop.mapreduce.Job -->
  13953. <class name="Job" extends="org.apache.hadoop.mapreduce.task.JobContextImpl"
  13954. abstract="false"
  13955. static="false" final="false" visibility="public"
  13956. deprecated="not deprecated">
  13957. <implements name="org.apache.hadoop.mapreduce.JobContext"/>
  13958. <constructor name="Job"
  13959. static="false" final="false" visibility="public"
  13960. deprecated="not deprecated">
  13961. <exception name="IOException" type="java.io.IOException"/>
  13962. </constructor>
  13963. <constructor name="Job" type="org.apache.hadoop.conf.Configuration"
  13964. static="false" final="false" visibility="public"
  13965. deprecated="not deprecated">
  13966. <exception name="IOException" type="java.io.IOException"/>
  13967. </constructor>
  13968. <constructor name="Job" type="org.apache.hadoop.conf.Configuration, java.lang.String"
  13969. static="false" final="false" visibility="public"
  13970. deprecated="not deprecated">
  13971. <exception name="IOException" type="java.io.IOException"/>
  13972. </constructor>
  13973. <method name="getInstance" return="org.apache.hadoop.mapreduce.Job"
  13974. abstract="false" native="false" synchronized="false"
  13975. static="true" final="false" visibility="public"
  13976. deprecated="not deprecated">
  13977. <exception name="IOException" type="java.io.IOException"/>
  13978. <doc>
  13979. <![CDATA[Creates a new {@link Job} with no particular {@link Cluster} .
  13980. A Cluster will be created with a generic {@link Configuration}.
  13981. @return the {@link Job} , with no connection to a cluster yet.
  13982. @throws IOException]]>
  13983. </doc>
  13984. </method>
  13985. <method name="getInstance" return="org.apache.hadoop.mapreduce.Job"
  13986. abstract="false" native="false" synchronized="false"
  13987. static="true" final="false" visibility="public"
  13988. deprecated="not deprecated">
  13989. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  13990. <exception name="IOException" type="java.io.IOException"/>
  13991. <doc>
  13992. <![CDATA[Creates a new {@link Job} with no particular {@link Cluster} .
  13993. A Cluster will be created from the conf parameter only when it's needed.
  13994. @param conf the configuration
  13995. @return the {@link Job} , with no connection to a cluster yet.
  13996. @throws IOException]]>
  13997. </doc>
  13998. </method>
  13999. <method name="getInstance" return="org.apache.hadoop.mapreduce.Job"
  14000. abstract="false" native="false" synchronized="false"
  14001. static="true" final="false" visibility="public"
  14002. deprecated="not deprecated">
  14003. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14004. <param name="jobName" type="java.lang.String"/>
  14005. <exception name="IOException" type="java.io.IOException"/>
  14006. <doc>
  14007. <![CDATA[Creates a new {@link Job} with no particular {@link Cluster} and a given jobName.
  14008. A Cluster will be created from the conf parameter only when it's needed.
  14009. @param conf the configuration
  14010. @return the {@link Job} , with no connection to a cluster yet.
  14011. @throws IOException]]>
  14012. </doc>
  14013. </method>
  14014. <method name="getInstance" return="org.apache.hadoop.mapreduce.Job"
  14015. abstract="false" native="false" synchronized="false"
  14016. static="true" final="false" visibility="public"
  14017. deprecated="not deprecated">
  14018. <param name="cluster" type="org.apache.hadoop.mapreduce.Cluster"/>
  14019. <exception name="IOException" type="java.io.IOException"/>
  14020. </method>
  14021. <method name="getInstance" return="org.apache.hadoop.mapreduce.Job"
  14022. abstract="false" native="false" synchronized="false"
  14023. static="true" final="false" visibility="public"
  14024. deprecated="not deprecated">
  14025. <param name="cluster" type="org.apache.hadoop.mapreduce.Cluster"/>
  14026. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14027. <exception name="IOException" type="java.io.IOException"/>
  14028. </method>
  14029. <method name="getInstance" return="org.apache.hadoop.mapreduce.Job"
  14030. abstract="false" native="false" synchronized="false"
  14031. static="true" final="false" visibility="public"
  14032. deprecated="not deprecated">
  14033. <param name="cluster" type="org.apache.hadoop.mapreduce.Cluster"/>
  14034. <param name="status" type="org.apache.hadoop.mapreduce.JobStatus"/>
  14035. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14036. <exception name="IOException" type="java.io.IOException"/>
  14037. </method>
  14038. <method name="getStatus" return="org.apache.hadoop.mapreduce.JobStatus"
  14039. abstract="false" native="false" synchronized="false"
  14040. static="false" final="false" visibility="public"
  14041. deprecated="not deprecated">
  14042. <exception name="IOException" type="java.io.IOException"/>
  14043. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14044. </method>
  14045. <method name="getJobState" return="org.apache.hadoop.mapreduce.JobStatus.State"
  14046. abstract="false" native="false" synchronized="false"
  14047. static="false" final="false" visibility="public"
  14048. deprecated="not deprecated">
  14049. <exception name="IOException" type="java.io.IOException"/>
  14050. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14051. <doc>
  14052. <![CDATA[Returns the current state of the Job.
  14053. @return JobStatus#State
  14054. @throws IOException
  14055. @throws InterruptedException]]>
  14056. </doc>
  14057. </method>
  14058. <method name="getTrackingURL" return="java.lang.String"
  14059. abstract="false" native="false" synchronized="false"
  14060. static="false" final="false" visibility="public"
  14061. deprecated="not deprecated">
  14062. <doc>
  14063. <![CDATA[Get the URL where some job progress information will be displayed.
  14064. @return the URL where some job progress information will be displayed.]]>
  14065. </doc>
  14066. </method>
  14067. <method name="getJobFile" return="java.lang.String"
  14068. abstract="false" native="false" synchronized="false"
  14069. static="false" final="false" visibility="public"
  14070. deprecated="not deprecated">
  14071. <doc>
  14072. <![CDATA[Get the path of the submitted job configuration.
  14073. @return the path of the submitted job configuration.]]>
  14074. </doc>
  14075. </method>
  14076. <method name="getStartTime" return="long"
  14077. abstract="false" native="false" synchronized="false"
  14078. static="false" final="false" visibility="public"
  14079. deprecated="not deprecated">
  14080. <doc>
  14081. <![CDATA[Get start time of the job.
  14082. @return the start time of the job]]>
  14083. </doc>
  14084. </method>
  14085. <method name="getFinishTime" return="long"
  14086. abstract="false" native="false" synchronized="false"
  14087. static="false" final="false" visibility="public"
  14088. deprecated="not deprecated">
  14089. <exception name="IOException" type="java.io.IOException"/>
  14090. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14091. <doc>
  14092. <![CDATA[Get finish time of the job.
  14093. @return the finish time of the job]]>
  14094. </doc>
  14095. </method>
  14096. <method name="getSchedulingInfo" return="java.lang.String"
  14097. abstract="false" native="false" synchronized="false"
  14098. static="false" final="false" visibility="public"
  14099. deprecated="not deprecated">
  14100. <doc>
  14101. <![CDATA[Get scheduling info of the job.
  14102. @return the scheduling info of the job]]>
  14103. </doc>
  14104. </method>
  14105. <method name="getPriority" return="org.apache.hadoop.mapreduce.JobPriority"
  14106. abstract="false" native="false" synchronized="false"
  14107. static="false" final="false" visibility="public"
  14108. deprecated="not deprecated">
  14109. <exception name="IOException" type="java.io.IOException"/>
  14110. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14111. <doc>
  14112. <![CDATA[Get the priority of the job.
  14113. @return the priority of the job]]>
  14114. </doc>
  14115. </method>
  14116. <method name="getJobName" return="java.lang.String"
  14117. abstract="false" native="false" synchronized="false"
  14118. static="false" final="false" visibility="public"
  14119. deprecated="not deprecated">
  14120. <doc>
  14121. <![CDATA[The user-specified job name.]]>
  14122. </doc>
  14123. </method>
  14124. <method name="getHistoryUrl" return="java.lang.String"
  14125. abstract="false" native="false" synchronized="false"
  14126. static="false" final="false" visibility="public"
  14127. deprecated="not deprecated">
  14128. <exception name="IOException" type="java.io.IOException"/>
  14129. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14130. </method>
  14131. <method name="isRetired" return="boolean"
  14132. abstract="false" native="false" synchronized="false"
  14133. static="false" final="false" visibility="public"
  14134. deprecated="not deprecated">
  14135. <exception name="IOException" type="java.io.IOException"/>
  14136. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14137. </method>
  14138. <method name="toString" return="java.lang.String"
  14139. abstract="false" native="false" synchronized="false"
  14140. static="false" final="false" visibility="public"
  14141. deprecated="not deprecated">
  14142. <doc>
  14143. <![CDATA[Dump stats to screen.]]>
  14144. </doc>
  14145. </method>
  14146. <method name="getTaskReports" return="org.apache.hadoop.mapreduce.TaskReport[]"
  14147. abstract="false" native="false" synchronized="false"
  14148. static="false" final="false" visibility="public"
  14149. deprecated="not deprecated">
  14150. <param name="type" type="org.apache.hadoop.mapreduce.TaskType"/>
  14151. <exception name="IOException" type="java.io.IOException"/>
  14152. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14153. <doc>
  14154. <![CDATA[Get the information of the current state of the tasks of a job.
  14155. @param type Type of the task
  14156. @return the list of task reports for the tasks of the given type.
  14157. @throws IOException]]>
  14158. </doc>
  14159. </method>
  14160. <method name="mapProgress" return="float"
  14161. abstract="false" native="false" synchronized="false"
  14162. static="false" final="false" visibility="public"
  14163. deprecated="not deprecated">
  14164. <exception name="IOException" type="java.io.IOException"/>
  14165. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14166. <doc>
  14167. <![CDATA[Get the <i>progress</i> of the job's map-tasks, as a float between 0.0
  14168. and 1.0. When all map tasks have completed, the function returns 1.0.
  14169. @return the progress of the job's map-tasks.
  14170. @throws IOException]]>
  14171. </doc>
  14172. </method>
  14173. <method name="reduceProgress" return="float"
  14174. abstract="false" native="false" synchronized="false"
  14175. static="false" final="false" visibility="public"
  14176. deprecated="not deprecated">
  14177. <exception name="IOException" type="java.io.IOException"/>
  14178. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14179. <doc>
  14180. <![CDATA[Get the <i>progress</i> of the job's reduce-tasks, as a float between 0.0
  14181. and 1.0. When all reduce tasks have completed, the function returns 1.0.
  14182. @return the progress of the job's reduce-tasks.
  14183. @throws IOException]]>
  14184. </doc>
  14185. </method>
  14186. <method name="cleanupProgress" return="float"
  14187. abstract="false" native="false" synchronized="false"
  14188. static="false" final="false" visibility="public"
  14189. deprecated="not deprecated">
  14190. <exception name="IOException" type="java.io.IOException"/>
  14191. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14192. <doc>
  14193. <![CDATA[Get the <i>progress</i> of the job's cleanup-tasks, as a float between 0.0
  14194. and 1.0. When all cleanup tasks have completed, the function returns 1.0.
  14195. @return the progress of the job's cleanup-tasks.
  14196. @throws IOException]]>
  14197. </doc>
  14198. </method>
  14199. <method name="setupProgress" return="float"
  14200. abstract="false" native="false" synchronized="false"
  14201. static="false" final="false" visibility="public"
  14202. deprecated="not deprecated">
  14203. <exception name="IOException" type="java.io.IOException"/>
  14204. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14205. <doc>
  14206. <![CDATA[Get the <i>progress</i> of the job's setup-tasks, as a float between 0.0
  14207. and 1.0. When all setup tasks have completed, the function returns 1.0.
  14208. @return the progress of the job's setup-tasks.
  14209. @throws IOException]]>
  14210. </doc>
  14211. </method>
  14212. <method name="isComplete" return="boolean"
  14213. abstract="false" native="false" synchronized="false"
  14214. static="false" final="false" visibility="public"
  14215. deprecated="not deprecated">
  14216. <exception name="IOException" type="java.io.IOException"/>
  14217. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14218. <doc>
  14219. <![CDATA[Check if the job is finished or not.
  14220. This is a non-blocking call.
  14221. @return <code>true</code> if the job is complete, else <code>false</code>.
  14222. @throws IOException]]>
  14223. </doc>
  14224. </method>
  14225. <method name="isSuccessful" return="boolean"
  14226. abstract="false" native="false" synchronized="false"
  14227. static="false" final="false" visibility="public"
  14228. deprecated="not deprecated">
  14229. <exception name="IOException" type="java.io.IOException"/>
  14230. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14231. <doc>
  14232. <![CDATA[Check if the job completed successfully.
  14233. @return <code>true</code> if the job succeeded, else <code>false</code>.
  14234. @throws IOException]]>
  14235. </doc>
  14236. </method>
  14237. <method name="killJob"
  14238. abstract="false" native="false" synchronized="false"
  14239. static="false" final="false" visibility="public"
  14240. deprecated="not deprecated">
  14241. <exception name="IOException" type="java.io.IOException"/>
  14242. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14243. <doc>
  14244. <![CDATA[Kill the running job. Blocks until all job tasks have been
  14245. killed as well. If the job is no longer running, it simply returns.
  14246. @throws IOException]]>
  14247. </doc>
  14248. </method>
  14249. <method name="setPriority"
  14250. abstract="false" native="false" synchronized="false"
  14251. static="false" final="false" visibility="public"
  14252. deprecated="not deprecated">
  14253. <param name="priority" type="org.apache.hadoop.mapreduce.JobPriority"/>
  14254. <exception name="IOException" type="java.io.IOException"/>
  14255. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14256. <doc>
  14257. <![CDATA[Set the priority of a running job.
  14258. @param priority the new priority for the job.
  14259. @throws IOException]]>
  14260. </doc>
  14261. </method>
  14262. <method name="getTaskCompletionEvents" return="org.apache.hadoop.mapreduce.TaskCompletionEvent[]"
  14263. abstract="false" native="false" synchronized="false"
  14264. static="false" final="false" visibility="public"
  14265. deprecated="not deprecated">
  14266. <param name="startFrom" type="int"/>
  14267. <param name="numEvents" type="int"/>
  14268. <exception name="IOException" type="java.io.IOException"/>
  14269. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14270. <doc>
  14271. <![CDATA[Get events indicating completion (success/failure) of component tasks.
  14272. @param startFrom index to start fetching events from
  14273. @param numEvents number of events to fetch
  14274. @return an array of {@link TaskCompletionEvent}s
  14275. @throws IOException]]>
  14276. </doc>
  14277. </method>
  14278. <method name="killTask" return="boolean"
  14279. abstract="false" native="false" synchronized="false"
  14280. static="false" final="false" visibility="public"
  14281. deprecated="not deprecated">
  14282. <param name="taskId" type="org.apache.hadoop.mapreduce.TaskAttemptID"/>
  14283. <exception name="IOException" type="java.io.IOException"/>
  14284. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14285. <doc>
  14286. <![CDATA[Kill indicated task attempt.
  14287. @param taskId the id of the task to be terminated.
  14288. @throws IOException]]>
  14289. </doc>
  14290. </method>
  14291. <method name="failTask" return="boolean"
  14292. abstract="false" native="false" synchronized="false"
  14293. static="false" final="false" visibility="public"
  14294. deprecated="not deprecated">
  14295. <param name="taskId" type="org.apache.hadoop.mapreduce.TaskAttemptID"/>
  14296. <exception name="IOException" type="java.io.IOException"/>
  14297. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14298. <doc>
  14299. <![CDATA[Fail indicated task attempt.
  14300. @param taskId the id of the task to be terminated.
  14301. @throws IOException]]>
  14302. </doc>
  14303. </method>
  14304. <method name="getCounters" return="org.apache.hadoop.mapreduce.Counters"
  14305. abstract="false" native="false" synchronized="false"
  14306. static="false" final="false" visibility="public"
  14307. deprecated="not deprecated">
  14308. <exception name="IOException" type="java.io.IOException"/>
  14309. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14310. <doc>
  14311. <![CDATA[Gets the counters for this job. May return null if the job has been
  14312. retired and the job is no longer in the completed job store.
  14313. @return the counters for this job.
  14314. @throws IOException]]>
  14315. </doc>
  14316. </method>
  14317. <method name="getTaskDiagnostics" return="java.lang.String[]"
  14318. abstract="false" native="false" synchronized="false"
  14319. static="false" final="false" visibility="public"
  14320. deprecated="not deprecated">
  14321. <param name="taskid" type="org.apache.hadoop.mapreduce.TaskAttemptID"/>
  14322. <exception name="IOException" type="java.io.IOException"/>
  14323. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14324. <doc>
  14325. <![CDATA[Gets the diagnostic messages for a given task attempt.
  14326. @param taskid the id of the task attempt whose diagnostics are requested
  14327. @return the list of diagnostic messages for the task
  14328. @throws IOException]]>
  14329. </doc>
  14330. </method>
  14331. <method name="setNumReduceTasks"
  14332. abstract="false" native="false" synchronized="false"
  14333. static="false" final="false" visibility="public"
  14334. deprecated="not deprecated">
  14335. <param name="tasks" type="int"/>
  14336. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14337. <doc>
  14338. <![CDATA[Set the number of reduce tasks for the job.
  14339. @param tasks the number of reduce tasks
  14340. @throws IllegalStateException if the job is submitted]]>
  14341. </doc>
  14342. </method>
  14343. <method name="setWorkingDirectory"
  14344. abstract="false" native="false" synchronized="false"
  14345. static="false" final="false" visibility="public"
  14346. deprecated="not deprecated">
  14347. <param name="dir" type="org.apache.hadoop.fs.Path"/>
  14348. <exception name="IOException" type="java.io.IOException"/>
  14349. <doc>
  14350. <![CDATA[Set the current working directory for the default file system.
  14351. @param dir the new current working directory.
  14352. @throws IllegalStateException if the job is submitted]]>
  14353. </doc>
  14354. </method>
  14355. <method name="setInputFormatClass"
  14356. abstract="false" native="false" synchronized="false"
  14357. static="false" final="false" visibility="public"
  14358. deprecated="not deprecated">
  14359. <param name="cls" type="java.lang.Class"/>
  14360. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14361. <doc>
  14362. <![CDATA[Set the {@link InputFormat} for the job.
  14363. @param cls the <code>InputFormat</code> to use
  14364. @throws IllegalStateException if the job is submitted]]>
  14365. </doc>
  14366. </method>
  14367. <method name="setOutputFormatClass"
  14368. abstract="false" native="false" synchronized="false"
  14369. static="false" final="false" visibility="public"
  14370. deprecated="not deprecated">
  14371. <param name="cls" type="java.lang.Class"/>
  14372. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14373. <doc>
  14374. <![CDATA[Set the {@link OutputFormat} for the job.
  14375. @param cls the <code>OutputFormat</code> to use
  14376. @throws IllegalStateException if the job is submitted]]>
  14377. </doc>
  14378. </method>
  14379. <method name="setMapperClass"
  14380. abstract="false" native="false" synchronized="false"
  14381. static="false" final="false" visibility="public"
  14382. deprecated="not deprecated">
  14383. <param name="cls" type="java.lang.Class"/>
  14384. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14385. <doc>
  14386. <![CDATA[Set the {@link Mapper} for the job.
  14387. @param cls the <code>Mapper</code> to use
  14388. @throws IllegalStateException if the job is submitted]]>
  14389. </doc>
  14390. </method>
  14391. <method name="setJarByClass"
  14392. abstract="false" native="false" synchronized="false"
  14393. static="false" final="false" visibility="public"
  14394. deprecated="not deprecated">
  14395. <param name="cls" type="java.lang.Class"/>
  14396. <doc>
  14397. <![CDATA[Set the Jar by finding where a given class came from.
  14398. @param cls the example class]]>
  14399. </doc>
  14400. </method>
  14401. <method name="setJar"
  14402. abstract="false" native="false" synchronized="false"
  14403. static="false" final="false" visibility="public"
  14404. deprecated="not deprecated">
  14405. <param name="jar" type="java.lang.String"/>
  14406. <doc>
  14407. <![CDATA[Set the job jar]]>
  14408. </doc>
  14409. </method>
  14410. <method name="setUser"
  14411. abstract="false" native="false" synchronized="false"
  14412. static="false" final="false" visibility="public"
  14413. deprecated="not deprecated">
  14414. <param name="user" type="java.lang.String"/>
  14415. <doc>
  14416. <![CDATA[Set the reported username for this job.
  14417. @param user the username for this job.]]>
  14418. </doc>
  14419. </method>
  14420. <method name="setCombinerClass"
  14421. abstract="false" native="false" synchronized="false"
  14422. static="false" final="false" visibility="public"
  14423. deprecated="not deprecated">
  14424. <param name="cls" type="java.lang.Class"/>
  14425. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14426. <doc>
  14427. <![CDATA[Set the combiner class for the job.
  14428. @param cls the combiner to use
  14429. @throws IllegalStateException if the job is submitted]]>
  14430. </doc>
  14431. </method>
  14432. <method name="setReducerClass"
  14433. abstract="false" native="false" synchronized="false"
  14434. static="false" final="false" visibility="public"
  14435. deprecated="not deprecated">
  14436. <param name="cls" type="java.lang.Class"/>
  14437. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14438. <doc>
  14439. <![CDATA[Set the {@link Reducer} for the job.
  14440. @param cls the <code>Reducer</code> to use
  14441. @throws IllegalStateException if the job is submitted]]>
  14442. </doc>
  14443. </method>
  14444. <method name="setPartitionerClass"
  14445. abstract="false" native="false" synchronized="false"
  14446. static="false" final="false" visibility="public"
  14447. deprecated="not deprecated">
  14448. <param name="cls" type="java.lang.Class"/>
  14449. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14450. <doc>
  14451. <![CDATA[Set the {@link Partitioner} for the job.
  14452. @param cls the <code>Partitioner</code> to use
  14453. @throws IllegalStateException if the job is submitted]]>
  14454. </doc>
  14455. </method>
  14456. <method name="setMapOutputKeyClass"
  14457. abstract="false" native="false" synchronized="false"
  14458. static="false" final="false" visibility="public"
  14459. deprecated="not deprecated">
  14460. <param name="theClass" type="java.lang.Class"/>
  14461. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14462. <doc>
  14463. <![CDATA[Set the key class for the map output data. This allows the user to
  14464. specify the map output key class to be different than the final output
  14465. key class.
  14466. @param theClass the map output key class.
  14467. @throws IllegalStateException if the job is submitted]]>
  14468. </doc>
  14469. </method>
  14470. <method name="setMapOutputValueClass"
  14471. abstract="false" native="false" synchronized="false"
  14472. static="false" final="false" visibility="public"
  14473. deprecated="not deprecated">
  14474. <param name="theClass" type="java.lang.Class"/>
  14475. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14476. <doc>
  14477. <![CDATA[Set the value class for the map output data. This allows the user to
  14478. specify the map output value class to be different than the final output
  14479. value class.
  14480. @param theClass the map output value class.
  14481. @throws IllegalStateException if the job is submitted]]>
  14482. </doc>
  14483. </method>
  14484. <method name="setOutputKeyClass"
  14485. abstract="false" native="false" synchronized="false"
  14486. static="false" final="false" visibility="public"
  14487. deprecated="not deprecated">
  14488. <param name="theClass" type="java.lang.Class"/>
  14489. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14490. <doc>
  14491. <![CDATA[Set the key class for the job output data.
  14492. @param theClass the key class for the job output data.
  14493. @throws IllegalStateException if the job is submitted]]>
  14494. </doc>
  14495. </method>
  14496. <method name="setOutputValueClass"
  14497. abstract="false" native="false" synchronized="false"
  14498. static="false" final="false" visibility="public"
  14499. deprecated="not deprecated">
  14500. <param name="theClass" type="java.lang.Class"/>
  14501. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14502. <doc>
  14503. <![CDATA[Set the value class for job outputs.
  14504. @param theClass the value class for job outputs.
  14505. @throws IllegalStateException if the job is submitted]]>
  14506. </doc>
  14507. </method>
  14508. <method name="setSortComparatorClass"
  14509. abstract="false" native="false" synchronized="false"
  14510. static="false" final="false" visibility="public"
  14511. deprecated="not deprecated">
  14512. <param name="cls" type="java.lang.Class"/>
  14513. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14514. <doc>
  14515. <![CDATA[Define the comparator that controls how the keys are sorted before they
  14516. are passed to the {@link Reducer}.
  14517. @param cls the raw comparator
  14518. @throws IllegalStateException if the job is submitted]]>
  14519. </doc>
  14520. </method>
  14521. <method name="setGroupingComparatorClass"
  14522. abstract="false" native="false" synchronized="false"
  14523. static="false" final="false" visibility="public"
  14524. deprecated="not deprecated">
  14525. <param name="cls" type="java.lang.Class"/>
  14526. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14527. <doc>
  14528. <![CDATA[Define the comparator that controls which keys are grouped together
  14529. for a single call to
  14530. {@link Reducer#reduce(Object, Iterable,
  14531. org.apache.hadoop.mapreduce.Reducer.Context)}
  14532. @param cls the raw comparator to use
  14533. @throws IllegalStateException if the job is submitted]]>
  14534. </doc>
  14535. </method>
  14536. <method name="setJobName"
  14537. abstract="false" native="false" synchronized="false"
  14538. static="false" final="false" visibility="public"
  14539. deprecated="not deprecated">
  14540. <param name="name" type="java.lang.String"/>
  14541. <exception name="IllegalStateException" type="java.lang.IllegalStateException"/>
  14542. <doc>
  14543. <![CDATA[Set the user-specified job name.
  14544. @param name the job's new name.
  14545. @throws IllegalStateException if the job is submitted]]>
  14546. </doc>
  14547. </method>
  14548. <method name="setSpeculativeExecution"
  14549. abstract="false" native="false" synchronized="false"
  14550. static="false" final="false" visibility="public"
  14551. deprecated="not deprecated">
  14552. <param name="speculativeExecution" type="boolean"/>
  14553. <doc>
  14554. <![CDATA[Turn speculative execution on or off for this job.
  14555. @param speculativeExecution <code>true</code> if speculative execution
  14556. should be turned on, else <code>false</code>.]]>
  14557. </doc>
  14558. </method>
  14559. <method name="setMapSpeculativeExecution"
  14560. abstract="false" native="false" synchronized="false"
  14561. static="false" final="false" visibility="public"
  14562. deprecated="not deprecated">
  14563. <param name="speculativeExecution" type="boolean"/>
  14564. <doc>
  14565. <![CDATA[Turn speculative execution on or off for this job for map tasks.
  14566. @param speculativeExecution <code>true</code> if speculative execution
  14567. should be turned on for map tasks,
  14568. else <code>false</code>.]]>
  14569. </doc>
  14570. </method>
  14571. <method name="setReduceSpeculativeExecution"
  14572. abstract="false" native="false" synchronized="false"
  14573. static="false" final="false" visibility="public"
  14574. deprecated="not deprecated">
  14575. <param name="speculativeExecution" type="boolean"/>
  14576. <doc>
  14577. <![CDATA[Turn speculative execution on or off for this job for reduce tasks.
  14578. @param speculativeExecution <code>true</code> if speculative execution
  14579. should be turned on for reduce tasks,
  14580. else <code>false</code>.]]>
  14581. </doc>
  14582. </method>
  14583. <method name="setJobSetupCleanupNeeded"
  14584. abstract="false" native="false" synchronized="false"
  14585. static="false" final="false" visibility="public"
  14586. deprecated="not deprecated">
  14587. <param name="needed" type="boolean"/>
  14588. <doc>
  14589. <![CDATA[Specify whether job-setup and job-cleanup are needed for the job
  14590. @param needed If <code>true</code>, job-setup and job-cleanup will be
  14591. considered from {@link OutputCommitter}
  14592. else ignored.]]>
  14593. </doc>
  14594. </method>
  14595. <method name="setCacheArchives"
  14596. abstract="false" native="false" synchronized="false"
  14597. static="false" final="false" visibility="public"
  14598. deprecated="not deprecated">
  14599. <param name="archives" type="java.net.URI[]"/>
  14600. <doc>
  14601. <![CDATA[Set the given set of archives
  14602. @param archives The list of archives that need to be localized]]>
  14603. </doc>
  14604. </method>
  14605. <method name="setCacheFiles"
  14606. abstract="false" native="false" synchronized="false"
  14607. static="false" final="false" visibility="public"
  14608. deprecated="not deprecated">
  14609. <param name="files" type="java.net.URI[]"/>
  14610. <doc>
  14611. <![CDATA[Set the given set of files
  14612. @param files The list of files that need to be localized]]>
  14613. </doc>
  14614. </method>
  14615. <method name="addCacheArchive"
  14616. abstract="false" native="false" synchronized="false"
  14617. static="false" final="false" visibility="public"
  14618. deprecated="not deprecated">
  14619. <param name="uri" type="java.net.URI"/>
  14620. <doc>
  14621. <![CDATA[Add an archive to be localized
  14622. @param uri The uri of the cache to be localized]]>
  14623. </doc>
  14624. </method>
  14625. <method name="addCacheFile"
  14626. abstract="false" native="false" synchronized="false"
  14627. static="false" final="false" visibility="public"
  14628. deprecated="not deprecated">
  14629. <param name="uri" type="java.net.URI"/>
  14630. <doc>
  14631. <![CDATA[Add a file to be localized
  14632. @param uri The uri of the cache to be localized]]>
  14633. </doc>
  14634. </method>
  14635. <method name="addFileToClassPath"
  14636. abstract="false" native="false" synchronized="false"
  14637. static="false" final="false" visibility="public"
  14638. deprecated="not deprecated">
  14639. <param name="file" type="org.apache.hadoop.fs.Path"/>
  14640. <exception name="IOException" type="java.io.IOException"/>
  14641. <doc>
  14642. <![CDATA[Add a file path to the current set of classpath entries. It adds the file
  14643. to cache as well.
  14644. Files added with this method will not be unpacked while being added to the
  14645. classpath.
  14646. To add archives to classpath, use the {@link #addArchiveToClassPath(Path)}
  14647. method instead.
  14648. @param file Path of the file to be added]]>
  14649. </doc>
  14650. </method>
  14651. <method name="addArchiveToClassPath"
  14652. abstract="false" native="false" synchronized="false"
  14653. static="false" final="false" visibility="public"
  14654. deprecated="not deprecated">
  14655. <param name="archive" type="org.apache.hadoop.fs.Path"/>
  14656. <exception name="IOException" type="java.io.IOException"/>
  14657. <doc>
  14658. <![CDATA[Add an archive path to the current set of classpath entries. It adds the
  14659. archive to cache as well.
  14660. Archive files will be unpacked and added to the classpath
  14661. when being distributed.
  14662. @param archive Path of the archive to be added]]>
  14663. </doc>
  14664. </method>
  14665. <method name="createSymlink"
  14666. abstract="false" native="false" synchronized="false"
  14667. static="false" final="false" visibility="public"
  14668. deprecated="not deprecated">
  14669. <doc>
  14670. <![CDATA[This method allows you to create symlinks in the current working directory
  14671. of the task to all the cache files/archives]]>
  14672. </doc>
  14673. </method>
  14674. <method name="setMaxMapAttempts"
  14675. abstract="false" native="false" synchronized="false"
  14676. static="false" final="false" visibility="public"
  14677. deprecated="not deprecated">
  14678. <param name="n" type="int"/>
  14679. <doc>
  14680. <![CDATA[Expert: Set the number of maximum attempts that will be made to run a
  14681. map task.
  14682. @param n the number of attempts per map task.]]>
  14683. </doc>
  14684. </method>
  14685. <method name="setMaxReduceAttempts"
  14686. abstract="false" native="false" synchronized="false"
  14687. static="false" final="false" visibility="public"
  14688. deprecated="not deprecated">
  14689. <param name="n" type="int"/>
  14690. <doc>
  14691. <![CDATA[Expert: Set the number of maximum attempts that will be made to run a
  14692. reduce task.
  14693. @param n the number of attempts per reduce task.]]>
  14694. </doc>
  14695. </method>
  14696. <method name="setProfileEnabled"
  14697. abstract="false" native="false" synchronized="false"
  14698. static="false" final="false" visibility="public"
  14699. deprecated="not deprecated">
  14700. <param name="newValue" type="boolean"/>
  14701. <doc>
  14702. <![CDATA[Set whether the system should collect profiler information for some of
  14703. the tasks in this job. The information is stored in the user log
  14704. directory.
  14705. @param newValue true means it should be gathered]]>
  14706. </doc>
  14707. </method>
  14708. <method name="setProfileParams"
  14709. abstract="false" native="false" synchronized="false"
  14710. static="false" final="false" visibility="public"
  14711. deprecated="not deprecated">
  14712. <param name="value" type="java.lang.String"/>
  14713. <doc>
  14714. <![CDATA[Set the profiler configuration arguments. If the string contains a '%s' it
  14715. will be replaced with the name of the profiling output file when the task
  14716. runs.
  14717. This value is passed to the task child JVM on the command line.
  14718. @param value the configuration string]]>
  14719. </doc>
  14720. </method>
  14721. <method name="setProfileTaskRange"
  14722. abstract="false" native="false" synchronized="false"
  14723. static="false" final="false" visibility="public"
  14724. deprecated="not deprecated">
  14725. <param name="isMap" type="boolean"/>
  14726. <param name="newValue" type="java.lang.String"/>
  14727. <doc>
  14728. <![CDATA[Set the ranges of maps or reduces to profile. setProfileEnabled(true)
  14729. must also be called.
  14730. @param newValue a set of integer ranges of the map or reduce ids]]>
  14731. </doc>
  14732. </method>
  14733. <method name="setCancelDelegationTokenUponJobCompletion"
  14734. abstract="false" native="false" synchronized="false"
  14735. static="false" final="false" visibility="public"
  14736. deprecated="not deprecated">
  14737. <param name="value" type="boolean"/>
  14738. <doc>
  14739. <![CDATA[Sets the flag that will allow the JobTracker to cancel the HDFS delegation
  14740. tokens upon job completion. Defaults to true.]]>
  14741. </doc>
  14742. </method>
  14743. <method name="submit"
  14744. abstract="false" native="false" synchronized="false"
  14745. static="false" final="false" visibility="public"
  14746. deprecated="not deprecated">
  14747. <exception name="IOException" type="java.io.IOException"/>
  14748. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14749. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  14750. <doc>
  14751. <![CDATA[Submit the job to the cluster and return immediately.
  14752. @throws IOException]]>
  14753. </doc>
  14754. </method>
  14755. <method name="waitForCompletion" return="boolean"
  14756. abstract="false" native="false" synchronized="false"
  14757. static="false" final="false" visibility="public"
  14758. deprecated="not deprecated">
  14759. <param name="verbose" type="boolean"/>
  14760. <exception name="IOException" type="java.io.IOException"/>
  14761. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14762. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  14763. <doc>
  14764. <![CDATA[Submit the job to the cluster and wait for it to finish.
  14765. @param verbose print the progress to the user
  14766. @return true if the job succeeded
  14767. @throws IOException thrown if the communication with the
  14768. <code>JobTracker</code> is lost]]>
  14769. </doc>
  14770. </method>
  14771. <method name="monitorAndPrintJob" return="boolean"
  14772. abstract="false" native="false" synchronized="false"
  14773. static="false" final="false" visibility="public"
  14774. deprecated="not deprecated">
  14775. <exception name="IOException" type="java.io.IOException"/>
  14776. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  14777. <doc>
  14778. <![CDATA[Monitor a job and print status in real-time as progress is made and tasks
  14779. fail.
  14780. @return true if the job succeeded
  14781. @throws IOException if communication to the JobTracker fails]]>
  14782. </doc>
  14783. </method>
  14784. <method name="getProgressPollInterval" return="int"
  14785. abstract="false" native="false" synchronized="false"
  14786. static="true" final="false" visibility="public"
  14787. deprecated="not deprecated">
  14788. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14789. <doc>
  14790. <![CDATA[The interval at which monitorAndPrintJob() prints status]]>
  14791. </doc>
  14792. </method>
  14793. <method name="getCompletionPollInterval" return="int"
  14794. abstract="false" native="false" synchronized="false"
  14795. static="true" final="false" visibility="public"
  14796. deprecated="not deprecated">
  14797. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14798. <doc>
  14799. <![CDATA[The interval at which waitForCompletion() should check.]]>
  14800. </doc>
  14801. </method>
  14802. <method name="getTaskOutputFilter" return="org.apache.hadoop.mapreduce.Job.TaskStatusFilter"
  14803. abstract="false" native="false" synchronized="false"
  14804. static="true" final="false" visibility="public"
  14805. deprecated="not deprecated">
  14806. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14807. <doc>
  14808. <![CDATA[Get the task output filter.
  14809. @param conf the configuration.
  14810. @return the filter level.]]>
  14811. </doc>
  14812. </method>
  14813. <method name="setTaskOutputFilter"
  14814. abstract="false" native="false" synchronized="false"
  14815. static="true" final="false" visibility="public"
  14816. deprecated="not deprecated">
  14817. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  14818. <param name="newValue" type="org.apache.hadoop.mapreduce.Job.TaskStatusFilter"/>
  14819. <doc>
  14820. <![CDATA[Modify the Configuration to set the task output filter.
  14821. @param conf the Configuration to modify.
  14822. @param newValue the value to set.]]>
  14823. </doc>
  14824. </method>
  14825. <field name="OUTPUT_FILTER" type="java.lang.String"
  14826. transient="false" volatile="false"
  14827. static="true" final="true" visibility="public"
  14828. deprecated="not deprecated">
  14829. </field>
  14830. <field name="COMPLETION_POLL_INTERVAL_KEY" type="java.lang.String"
  14831. transient="false" volatile="false"
  14832. static="true" final="true" visibility="public"
  14833. deprecated="not deprecated">
  14834. <doc>
  14835. <![CDATA[Key in mapred-*.xml that sets completionPollIntervalMillis]]>
  14836. </doc>
  14837. </field>
  14838. <field name="PROGRESS_MONITOR_POLL_INTERVAL_KEY" type="java.lang.String"
  14839. transient="false" volatile="false"
  14840. static="true" final="true" visibility="public"
  14841. deprecated="not deprecated">
  14842. <doc>
  14843. <![CDATA[Key in mapred-*.xml that sets progMonitorPollIntervalMillis]]>
  14844. </doc>
  14845. </field>
  14846. <field name="USED_GENERIC_PARSER" type="java.lang.String"
  14847. transient="false" volatile="false"
  14848. static="true" final="true" visibility="public"
  14849. deprecated="not deprecated">
  14850. </field>
  14851. <field name="SUBMIT_REPLICATION" type="java.lang.String"
  14852. transient="false" volatile="false"
  14853. static="true" final="true" visibility="public"
  14854. deprecated="not deprecated">
  14855. </field>
  14856. <doc>
  14857. <![CDATA[The job submitter's view of the Job.
  14858. <p>It allows the user to configure the
  14859. job, submit it, control its execution, and query the state. The set methods
  14860. only work until the job is submitted, afterwards they will throw an
  14861. IllegalStateException. </p>
  14862. <p>
  14863. Normally the user creates the application, describes various facets of the
  14864. job via {@link Job} and then submits the job and monitors its progress.</p>
  14865. <p>Here is an example on how to submit a job:</p>
  14866. <p><blockquote><pre>
  14867. // Create a new Job
  14868. Job job = new Job(new Configuration());
  14869. job.setJarByClass(MyJob.class);
  14870. // Specify various job-specific parameters
  14871. job.setJobName("myjob");
  14872. job.setInputPath(new Path("in"));
  14873. job.setOutputPath(new Path("out"));
  14874. job.setMapperClass(MyJob.MyMapper.class);
  14875. job.setReducerClass(MyJob.MyReducer.class);
  14876. // Submit the job, then poll for progress until the job is complete
  14877. job.waitForCompletion(true);
  14878. </pre></blockquote></p>]]>
  14879. </doc>
  14880. </class>
  14881. <!-- end class org.apache.hadoop.mapreduce.Job -->
  14882. <!-- start class org.apache.hadoop.mapreduce.Job.JobState -->
  14883. <class name="Job.JobState" extends="java.lang.Enum"
  14884. abstract="false"
  14885. static="true" final="true" visibility="public"
  14886. deprecated="not deprecated">
  14887. <method name="values" return="org.apache.hadoop.mapreduce.Job.JobState[]"
  14888. abstract="false" native="false" synchronized="false"
  14889. static="true" final="false" visibility="public"
  14890. deprecated="not deprecated">
  14891. </method>
  14892. <method name="valueOf" return="org.apache.hadoop.mapreduce.Job.JobState"
  14893. abstract="false" native="false" synchronized="false"
  14894. static="true" final="false" visibility="public"
  14895. deprecated="not deprecated">
  14896. <param name="name" type="java.lang.String"/>
  14897. </method>
  14898. </class>
  14899. <!-- end class org.apache.hadoop.mapreduce.Job.JobState -->
  14900. <!-- start class org.apache.hadoop.mapreduce.Job.TaskStatusFilter -->
  14901. <class name="Job.TaskStatusFilter" extends="java.lang.Enum"
  14902. abstract="false"
  14903. static="true" final="true" visibility="public"
  14904. deprecated="not deprecated">
  14905. <method name="values" return="org.apache.hadoop.mapreduce.Job.TaskStatusFilter[]"
  14906. abstract="false" native="false" synchronized="false"
  14907. static="true" final="false" visibility="public"
  14908. deprecated="not deprecated">
  14909. </method>
  14910. <method name="valueOf" return="org.apache.hadoop.mapreduce.Job.TaskStatusFilter"
  14911. abstract="false" native="false" synchronized="false"
  14912. static="true" final="false" visibility="public"
  14913. deprecated="not deprecated">
  14914. <param name="name" type="java.lang.String"/>
  14915. </method>
  14916. </class>
  14917. <!-- end class org.apache.hadoop.mapreduce.Job.TaskStatusFilter -->
  14918. <!-- start interface org.apache.hadoop.mapreduce.JobContext -->
  14919. <interface name="JobContext" abstract="true"
  14920. static="false" final="false" visibility="public"
  14921. deprecated="not deprecated">
  14922. <implements name="org.apache.hadoop.mapreduce.MRJobConfig"/>
  14923. <method name="getConfiguration" return="org.apache.hadoop.conf.Configuration"
  14924. abstract="false" native="false" synchronized="false"
  14925. static="false" final="false" visibility="public"
  14926. deprecated="not deprecated">
  14927. <doc>
  14928. <![CDATA[Return the configuration for the job.
  14929. @return the shared configuration object]]>
  14930. </doc>
  14931. </method>
  14932. <method name="getCredentials" return="org.apache.hadoop.security.Credentials"
  14933. abstract="false" native="false" synchronized="false"
  14934. static="false" final="false" visibility="public"
  14935. deprecated="not deprecated">
  14936. <doc>
  14937. <![CDATA[Get credentials for the job.
  14938. @return credentials for the job]]>
  14939. </doc>
  14940. </method>
  14941. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  14942. abstract="false" native="false" synchronized="false"
  14943. static="false" final="false" visibility="public"
  14944. deprecated="not deprecated">
  14945. <doc>
  14946. <![CDATA[Get the unique ID for the job.
  14947. @return the object with the job id]]>
  14948. </doc>
  14949. </method>
  14950. <method name="getNumReduceTasks" return="int"
  14951. abstract="false" native="false" synchronized="false"
  14952. static="false" final="false" visibility="public"
  14953. deprecated="not deprecated">
  14954. <doc>
  14955. <![CDATA[Get the configured number of reduce tasks for this job. Defaults to
  14956. <code>1</code>.
  14957. @return the number of reduce tasks for this job.]]>
  14958. </doc>
  14959. </method>
  14960. <method name="getWorkingDirectory" return="org.apache.hadoop.fs.Path"
  14961. abstract="false" native="false" synchronized="false"
  14962. static="false" final="false" visibility="public"
  14963. deprecated="not deprecated">
  14964. <exception name="IOException" type="java.io.IOException"/>
  14965. <doc>
  14966. <![CDATA[Get the current working directory for the default file system.
  14967. @return the directory name.]]>
  14968. </doc>
  14969. </method>
  14970. <method name="getOutputKeyClass" return="java.lang.Class"
  14971. abstract="false" native="false" synchronized="false"
  14972. static="false" final="false" visibility="public"
  14973. deprecated="not deprecated">
  14974. <doc>
  14975. <![CDATA[Get the key class for the job output data.
  14976. @return the key class for the job output data.]]>
  14977. </doc>
  14978. </method>
  14979. <method name="getOutputValueClass" return="java.lang.Class"
  14980. abstract="false" native="false" synchronized="false"
  14981. static="false" final="false" visibility="public"
  14982. deprecated="not deprecated">
  14983. <doc>
  14984. <![CDATA[Get the value class for job outputs.
  14985. @return the value class for job outputs.]]>
  14986. </doc>
  14987. </method>
  14988. <method name="getMapOutputKeyClass" return="java.lang.Class"
  14989. abstract="false" native="false" synchronized="false"
  14990. static="false" final="false" visibility="public"
  14991. deprecated="not deprecated">
  14992. <doc>
  14993. <![CDATA[Get the key class for the map output data. If it is not set, use the
  14994. (final) output key class. This allows the map output key class to be
  14995. different than the final output key class.
  14996. @return the map output key class.]]>
  14997. </doc>
  14998. </method>
  14999. <method name="getMapOutputValueClass" return="java.lang.Class"
  15000. abstract="false" native="false" synchronized="false"
  15001. static="false" final="false" visibility="public"
  15002. deprecated="not deprecated">
  15003. <doc>
  15004. <![CDATA[Get the value class for the map output data. If it is not set, use the
  15005. (final) output value class. This allows the map output value class to be
  15006. different than the final output value class.
  15007. @return the map output value class.]]>
  15008. </doc>
  15009. </method>
  15010. <method name="getJobName" return="java.lang.String"
  15011. abstract="false" native="false" synchronized="false"
  15012. static="false" final="false" visibility="public"
  15013. deprecated="not deprecated">
  15014. <doc>
  15015. <![CDATA[Get the user-specified job name. This is only used to identify the
  15016. job to the user.
  15017. @return the job's name, defaulting to "".]]>
  15018. </doc>
  15019. </method>
  15020. <method name="getInputFormatClass" return="java.lang.Class"
  15021. abstract="false" native="false" synchronized="false"
  15022. static="false" final="false" visibility="public"
  15023. deprecated="not deprecated">
  15024. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  15025. <doc>
  15026. <![CDATA[Get the {@link InputFormat} class for the job.
  15027. @return the {@link InputFormat} class for the job.]]>
  15028. </doc>
  15029. </method>
  15030. <method name="getMapperClass" return="java.lang.Class"
  15031. abstract="false" native="false" synchronized="false"
  15032. static="false" final="false" visibility="public"
  15033. deprecated="not deprecated">
  15034. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  15035. <doc>
  15036. <![CDATA[Get the {@link Mapper} class for the job.
  15037. @return the {@link Mapper} class for the job.]]>
  15038. </doc>
  15039. </method>
  15040. <method name="getCombinerClass" return="java.lang.Class"
  15041. abstract="false" native="false" synchronized="false"
  15042. static="false" final="false" visibility="public"
  15043. deprecated="not deprecated">
  15044. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  15045. <doc>
  15046. <![CDATA[Get the combiner class for the job.
  15047. @return the combiner class for the job.]]>
  15048. </doc>
  15049. </method>
  15050. <method name="getReducerClass" return="java.lang.Class"
  15051. abstract="false" native="false" synchronized="false"
  15052. static="false" final="false" visibility="public"
  15053. deprecated="not deprecated">
  15054. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  15055. <doc>
  15056. <![CDATA[Get the {@link Reducer} class for the job.
  15057. @return the {@link Reducer} class for the job.]]>
  15058. </doc>
  15059. </method>
  15060. <method name="getOutputFormatClass" return="java.lang.Class"
  15061. abstract="false" native="false" synchronized="false"
  15062. static="false" final="false" visibility="public"
  15063. deprecated="not deprecated">
  15064. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  15065. <doc>
  15066. <![CDATA[Get the {@link OutputFormat} class for the job.
  15067. @return the {@link OutputFormat} class for the job.]]>
  15068. </doc>
  15069. </method>
  15070. <method name="getPartitionerClass" return="java.lang.Class"
  15071. abstract="false" native="false" synchronized="false"
  15072. static="false" final="false" visibility="public"
  15073. deprecated="not deprecated">
  15074. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  15075. <doc>
  15076. <![CDATA[Get the {@link Partitioner} class for the job.
  15077. @return the {@link Partitioner} class for the job.]]>
  15078. </doc>
  15079. </method>
  15080. <method name="getSortComparator" return="org.apache.hadoop.io.RawComparator"
  15081. abstract="false" native="false" synchronized="false"
  15082. static="false" final="false" visibility="public"
  15083. deprecated="not deprecated">
  15084. <doc>
  15085. <![CDATA[Get the {@link RawComparator} comparator used to compare keys.
  15086. @return the {@link RawComparator} comparator used to compare keys.]]>
  15087. </doc>
  15088. </method>
  15089. <method name="getJar" return="java.lang.String"
  15090. abstract="false" native="false" synchronized="false"
  15091. static="false" final="false" visibility="public"
  15092. deprecated="not deprecated">
  15093. <doc>
  15094. <![CDATA[Get the pathname of the job's jar.
  15095. @return the pathname]]>
  15096. </doc>
  15097. </method>
  15098. <method name="getGroupingComparator" return="org.apache.hadoop.io.RawComparator"
  15099. abstract="false" native="false" synchronized="false"
  15100. static="false" final="false" visibility="public"
  15101. deprecated="not deprecated">
  15102. <doc>
  15103. <![CDATA[Get the user defined {@link RawComparator} comparator for
  15104. grouping keys of inputs to the reduce.
  15105. @return comparator set by the user for grouping values.
  15106. @see Job#setGroupingComparatorClass(Class) for details.]]>
  15107. </doc>
  15108. </method>
  15109. <method name="getJobSetupCleanupNeeded" return="boolean"
  15110. abstract="false" native="false" synchronized="false"
  15111. static="false" final="false" visibility="public"
  15112. deprecated="not deprecated">
  15113. <doc>
  15114. <![CDATA[Get whether job-setup and job-cleanup are needed for the job
  15115. @return boolean]]>
  15116. </doc>
  15117. </method>
  15118. <method name="getProfileEnabled" return="boolean"
  15119. abstract="false" native="false" synchronized="false"
  15120. static="false" final="false" visibility="public"
  15121. deprecated="not deprecated">
  15122. <doc>
  15123. <![CDATA[Get whether the task profiling is enabled.
  15124. @return true if some tasks will be profiled]]>
  15125. </doc>
  15126. </method>
  15127. <method name="getProfileParams" return="java.lang.String"
  15128. abstract="false" native="false" synchronized="false"
  15129. static="false" final="false" visibility="public"
  15130. deprecated="not deprecated">
  15131. <doc>
  15132. <![CDATA[Get the profiler configuration arguments.
  15133. The default value for this property is
  15134. "-agentlib:hprof=cpu=samples,heap=sites,force=n,thread=y,verbose=n,file=%s"
  15135. @return the parameters to pass to the task child to configure profiling]]>
  15136. </doc>
  15137. </method>
  15138. <method name="getProfileTaskRange" return="org.apache.hadoop.conf.Configuration.IntegerRanges"
  15139. abstract="false" native="false" synchronized="false"
  15140. static="false" final="false" visibility="public"
  15141. deprecated="not deprecated">
  15142. <param name="isMap" type="boolean"/>
  15143. <doc>
  15144. <![CDATA[Get the range of maps or reduces to profile.
  15145. @param isMap is the task a map?
  15146. @return the task ranges]]>
  15147. </doc>
  15148. </method>
  15149. <method name="getUser" return="java.lang.String"
  15150. abstract="false" native="false" synchronized="false"
  15151. static="false" final="false" visibility="public"
  15152. deprecated="not deprecated">
  15153. <doc>
  15154. <![CDATA[Get the reported username for this job.
  15155. @return the username]]>
  15156. </doc>
  15157. </method>
  15158. <method name="getSymlink" return="boolean"
  15159. abstract="false" native="false" synchronized="false"
  15160. static="false" final="false" visibility="public"
  15161. deprecated="not deprecated">
  15162. <doc>
  15163. <![CDATA[This method checks to see if symlinks are to be created for the
  15164. localized cache files in the current working directory
  15165. @return true if symlinks are to be created, else false]]>
  15166. </doc>
  15167. </method>
  15168. <method name="getArchiveClassPaths" return="org.apache.hadoop.fs.Path[]"
  15169. abstract="false" native="false" synchronized="false"
  15170. static="false" final="false" visibility="public"
  15171. deprecated="not deprecated">
  15172. <doc>
  15173. <![CDATA[Get the archive entries in classpath as an array of Path]]>
  15174. </doc>
  15175. </method>
  15176. <method name="getCacheArchives" return="java.net.URI[]"
  15177. abstract="false" native="false" synchronized="false"
  15178. static="false" final="false" visibility="public"
  15179. deprecated="not deprecated">
  15180. <exception name="IOException" type="java.io.IOException"/>
  15181. <doc>
  15182. <![CDATA[Get cache archives set in the Configuration
  15183. @return A URI array of the caches set in the Configuration
  15184. @throws IOException]]>
  15185. </doc>
  15186. </method>
  15187. <method name="getCacheFiles" return="java.net.URI[]"
  15188. abstract="false" native="false" synchronized="false"
  15189. static="false" final="false" visibility="public"
  15190. deprecated="not deprecated">
  15191. <exception name="IOException" type="java.io.IOException"/>
  15192. <doc>
  15193. <![CDATA[Get cache files set in the Configuration
  15194. @return A URI array of the files set in the Configuration
  15195. @throws IOException]]>
  15196. </doc>
  15197. </method>
  15198. <method name="getLocalCacheArchives" return="org.apache.hadoop.fs.Path[]"
  15199. abstract="false" native="false" synchronized="false"
  15200. static="false" final="false" visibility="public"
  15201. deprecated="not deprecated">
  15202. <exception name="IOException" type="java.io.IOException"/>
  15203. <doc>
  15204. <![CDATA[Return the path array of the localized caches
  15205. @return A path array of localized caches
  15206. @throws IOException]]>
  15207. </doc>
  15208. </method>
  15209. <method name="getLocalCacheFiles" return="org.apache.hadoop.fs.Path[]"
  15210. abstract="false" native="false" synchronized="false"
  15211. static="false" final="false" visibility="public"
  15212. deprecated="not deprecated">
  15213. <exception name="IOException" type="java.io.IOException"/>
  15214. <doc>
  15215. <![CDATA[Return the path array of the localized files
  15216. @return A path array of localized files
  15217. @throws IOException]]>
  15218. </doc>
  15219. </method>
  15220. <method name="getFileClassPaths" return="org.apache.hadoop.fs.Path[]"
  15221. abstract="false" native="false" synchronized="false"
  15222. static="false" final="false" visibility="public"
  15223. deprecated="not deprecated">
  15224. <doc>
  15225. <![CDATA[Get the file entries in classpath as an array of Path]]>
  15226. </doc>
  15227. </method>
  15228. <method name="getArchiveTimestamps" return="java.lang.String[]"
  15229. abstract="false" native="false" synchronized="false"
  15230. static="false" final="false" visibility="public"
  15231. deprecated="not deprecated">
  15232. <doc>
  15233. <![CDATA[Get the timestamps of the archives. Used by internal
  15234. DistributedCache and MapReduce code.
  15235. @return a string array of timestamps
  15236. @throws IOException]]>
  15237. </doc>
  15238. </method>
  15239. <method name="getFileTimestamps" return="java.lang.String[]"
  15240. abstract="false" native="false" synchronized="false"
  15241. static="false" final="false" visibility="public"
  15242. deprecated="not deprecated">
  15243. <doc>
  15244. <![CDATA[Get the timestamps of the files. Used by internal
  15245. DistributedCache and MapReduce code.
  15246. @return a string array of timestamps
  15247. @throws IOException]]>
  15248. </doc>
  15249. </method>
  15250. <method name="getMaxMapAttempts" return="int"
  15251. abstract="false" native="false" synchronized="false"
  15252. static="false" final="false" visibility="public"
  15253. deprecated="not deprecated">
  15254. <doc>
  15255. <![CDATA[Get the configured number of maximum attempts that will be made to run a
  15256. map task, as specified by the <code>mapred.map.max.attempts</code>
  15257. property. If this property is not already set, the default is 4 attempts.
  15258. @return the max number of attempts per map task.]]>
  15259. </doc>
  15260. </method>
  15261. <method name="getMaxReduceAttempts" return="int"
  15262. abstract="false" native="false" synchronized="false"
  15263. static="false" final="false" visibility="public"
  15264. deprecated="not deprecated">
  15265. <doc>
  15266. <![CDATA[Get the configured number of maximum attempts that will be made to run a
  15267. reduce task, as specified by the <code>mapred.reduce.max.attempts</code>
  15268. property. If this property is not already set, the default is 4 attempts.
  15269. @return the max number of attempts per reduce task.]]>
  15270. </doc>
  15271. </method>
  15272. <doc>
  15273. <![CDATA[A read-only view of the job that is provided to the tasks while they
  15274. are running.]]>
  15275. </doc>
  15276. </interface>
  15277. <!-- end interface org.apache.hadoop.mapreduce.JobContext -->
  15278. <!-- start class org.apache.hadoop.mapreduce.JobCounter -->
  15279. <class name="JobCounter" extends="java.lang.Enum"
  15280. abstract="false"
  15281. static="false" final="true" visibility="public"
  15282. deprecated="not deprecated">
  15283. <method name="values" return="org.apache.hadoop.mapreduce.JobCounter[]"
  15284. abstract="false" native="false" synchronized="false"
  15285. static="true" final="false" visibility="public"
  15286. deprecated="not deprecated">
  15287. </method>
  15288. <method name="valueOf" return="org.apache.hadoop.mapreduce.JobCounter"
  15289. abstract="false" native="false" synchronized="false"
  15290. static="true" final="false" visibility="public"
  15291. deprecated="not deprecated">
  15292. <param name="name" type="java.lang.String"/>
  15293. </method>
  15294. </class>
  15295. <!-- end class org.apache.hadoop.mapreduce.JobCounter -->
  15296. <!-- start class org.apache.hadoop.mapreduce.JobID -->
  15297. <class name="JobID" extends="org.apache.hadoop.mapred.ID"
  15298. abstract="false"
  15299. static="false" final="false" visibility="public"
  15300. deprecated="not deprecated">
  15301. <implements name="java.lang.Comparable"/>
  15302. <constructor name="JobID" type="java.lang.String, int"
  15303. static="false" final="false" visibility="public"
  15304. deprecated="not deprecated">
  15305. <doc>
  15306. <![CDATA[Constructs a JobID object
  15307. @param jtIdentifier jobTracker identifier
  15308. @param id job number]]>
  15309. </doc>
  15310. </constructor>
  15311. <constructor name="JobID"
  15312. static="false" final="false" visibility="public"
  15313. deprecated="not deprecated">
  15314. </constructor>
  15315. <method name="getJtIdentifier" return="java.lang.String"
  15316. abstract="false" native="false" synchronized="false"
  15317. static="false" final="false" visibility="public"
  15318. deprecated="not deprecated">
  15319. </method>
  15320. <method name="equals" return="boolean"
  15321. abstract="false" native="false" synchronized="false"
  15322. static="false" final="false" visibility="public"
  15323. deprecated="not deprecated">
  15324. <param name="o" type="java.lang.Object"/>
  15325. </method>
  15326. <method name="compareTo" return="int"
  15327. abstract="false" native="false" synchronized="false"
  15328. static="false" final="false" visibility="public"
  15329. deprecated="not deprecated">
  15330. <param name="o" type="org.apache.hadoop.mapreduce.ID"/>
  15331. <doc>
  15332. <![CDATA[Compare JobIds by first jtIdentifiers, then by job numbers]]>
  15333. </doc>
  15334. </method>
  15335. <method name="appendTo" return="java.lang.StringBuilder"
  15336. abstract="false" native="false" synchronized="false"
  15337. static="false" final="false" visibility="public"
  15338. deprecated="not deprecated">
  15339. <param name="builder" type="java.lang.StringBuilder"/>
  15340. <doc>
  15341. <![CDATA[Add the stuff after the "job" prefix to the given builder. This is useful,
  15342. because the sub-ids use this substring at the start of their string.
  15343. @param builder the builder to append to
  15344. @return the builder that was passed in]]>
  15345. </doc>
  15346. </method>
  15347. <method name="hashCode" return="int"
  15348. abstract="false" native="false" synchronized="false"
  15349. static="false" final="false" visibility="public"
  15350. deprecated="not deprecated">
  15351. </method>
  15352. <method name="toString" return="java.lang.String"
  15353. abstract="false" native="false" synchronized="false"
  15354. static="false" final="false" visibility="public"
  15355. deprecated="not deprecated">
  15356. </method>
  15357. <method name="readFields"
  15358. abstract="false" native="false" synchronized="false"
  15359. static="false" final="false" visibility="public"
  15360. deprecated="not deprecated">
  15361. <param name="in" type="java.io.DataInput"/>
  15362. <exception name="IOException" type="java.io.IOException"/>
  15363. </method>
  15364. <method name="write"
  15365. abstract="false" native="false" synchronized="false"
  15366. static="false" final="false" visibility="public"
  15367. deprecated="not deprecated">
  15368. <param name="out" type="java.io.DataOutput"/>
  15369. <exception name="IOException" type="java.io.IOException"/>
  15370. </method>
  15371. <method name="forName" return="org.apache.hadoop.mapreduce.JobID"
  15372. abstract="false" native="false" synchronized="false"
  15373. static="true" final="false" visibility="public"
  15374. deprecated="not deprecated">
  15375. <param name="str" type="java.lang.String"/>
  15376. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  15377. <doc>
  15378. <![CDATA[Construct a JobID object from the given string
  15379. @return constructed JobID object or null if the given String is null
  15380. @throws IllegalArgumentException if the given string is malformed]]>
  15381. </doc>
  15382. </method>
  15383. <field name="JOB" type="java.lang.String"
  15384. transient="false" volatile="false"
  15385. static="true" final="true" visibility="protected"
  15386. deprecated="not deprecated">
  15387. </field>
  15388. <field name="JOBID_REGEX" type="java.lang.String"
  15389. transient="false" volatile="false"
  15390. static="true" final="true" visibility="public"
  15391. deprecated="not deprecated">
  15392. </field>
  15393. <field name="idFormat" type="java.text.NumberFormat"
  15394. transient="false" volatile="false"
  15395. static="true" final="true" visibility="protected"
  15396. deprecated="not deprecated">
  15397. </field>
  15398. <doc>
  15399. <![CDATA[JobID represents the immutable and unique identifier for
  15400. the job. A JobID consists of two parts. The first part
  15401. represents the jobtracker identifier, so that a JobID-to-jobtracker mapping
  15402. is defined. For a cluster setup this string is the jobtracker
  15403. start time; for a local setting, it is "local".
  15404. The second part of the JobID is the job number. <br>
  15405. An example JobID is :
  15406. <code>job_200707121733_0003</code> , which represents the third job
  15407. running at the jobtracker started at <code>200707121733</code>.
  15408. <p>
  15409. Applications should never construct or parse JobID strings, but rather
  15410. use appropriate constructors or {@link #forName(String)} method.
  15411. @see TaskID
  15412. @see TaskAttemptID
  15413. @see org.apache.hadoop.mapred.JobTracker#getNewJobId()
  15414. @see org.apache.hadoop.mapred.JobTracker#getStartTime()]]>
  15415. </doc>
  15416. </class>
  15417. <!-- end class org.apache.hadoop.mapreduce.JobID -->
  15418. <!-- start class org.apache.hadoop.mapreduce.JobPriority -->
  15419. <class name="JobPriority" extends="java.lang.Enum"
  15420. abstract="false"
  15421. static="false" final="true" visibility="public"
  15422. deprecated="not deprecated">
  15423. <method name="values" return="org.apache.hadoop.mapreduce.JobPriority[]"
  15424. abstract="false" native="false" synchronized="false"
  15425. static="true" final="false" visibility="public"
  15426. deprecated="not deprecated">
  15427. </method>
  15428. <method name="valueOf" return="org.apache.hadoop.mapreduce.JobPriority"
  15429. abstract="false" native="false" synchronized="false"
  15430. static="true" final="false" visibility="public"
  15431. deprecated="not deprecated">
  15432. <param name="name" type="java.lang.String"/>
  15433. </method>
  15434. <doc>
  15435. <![CDATA[Used to describe the priority of the running job.]]>
  15436. </doc>
  15437. </class>
  15438. <!-- end class org.apache.hadoop.mapreduce.JobPriority -->
  15439. <!-- start class org.apache.hadoop.mapreduce.JobStatus -->
  15440. <class name="JobStatus" extends="java.lang.Object"
  15441. abstract="false"
  15442. static="false" final="false" visibility="public"
  15443. deprecated="not deprecated">
  15444. <implements name="org.apache.hadoop.io.Writable"/>
  15445. <implements name="java.lang.Cloneable"/>
  15446. <constructor name="JobStatus"
  15447. static="false" final="false" visibility="public"
  15448. deprecated="not deprecated">
  15449. </constructor>
  15450. <constructor name="JobStatus" type="org.apache.hadoop.mapreduce.JobID, float, float, float, float, org.apache.hadoop.mapreduce.JobStatus.State, org.apache.hadoop.mapreduce.JobPriority, java.lang.String, java.lang.String, java.lang.String, java.lang.String"
  15451. static="false" final="false" visibility="public"
  15452. deprecated="not deprecated">
  15453. <doc>
  15454. <![CDATA[Create a job status object for a given jobid.
  15455. @param jobid The jobid of the job
  15456. @param setupProgress The progress made on the setup
  15457. @param mapProgress The progress made on the maps
  15458. @param reduceProgress The progress made on the reduces
  15459. @param cleanupProgress The progress made on the cleanup
  15460. @param runState The current state of the job
  15461. @param jp Priority of the job.
  15462. @param user userid of the person who submitted the job.
  15463. @param jobName user-specified job name.
  15464. @param jobFile job configuration file.
  15465. @param trackingUrl link to the web-ui for details of the job.]]>
  15466. </doc>
  15467. </constructor>
  15468. <method name="setMapProgress"
  15469. abstract="false" native="false" synchronized="true"
  15470. static="false" final="false" visibility="protected"
  15471. deprecated="not deprecated">
  15472. <param name="p" type="float"/>
  15473. <doc>
  15474. <![CDATA[Sets the map progress of this job
  15475. @param p The value of map progress to set to]]>
  15476. </doc>
  15477. </method>
  15478. <method name="setCleanupProgress"
  15479. abstract="false" native="false" synchronized="true"
  15480. static="false" final="false" visibility="protected"
  15481. deprecated="not deprecated">
  15482. <param name="p" type="float"/>
  15483. <doc>
  15484. <![CDATA[Sets the cleanup progress of this job
  15485. @param p The value of cleanup progress to set to]]>
  15486. </doc>
  15487. </method>
  15488. <method name="setSetupProgress"
  15489. abstract="false" native="false" synchronized="true"
  15490. static="false" final="false" visibility="protected"
  15491. deprecated="not deprecated">
  15492. <param name="p" type="float"/>
  15493. <doc>
  15494. <![CDATA[Sets the setup progress of this job
  15495. @param p The value of setup progress to set to]]>
  15496. </doc>
  15497. </method>
  15498. <method name="setReduceProgress"
  15499. abstract="false" native="false" synchronized="true"
  15500. static="false" final="false" visibility="protected"
  15501. deprecated="not deprecated">
  15502. <param name="p" type="float"/>
  15503. <doc>
  15504. <![CDATA[Sets the reduce progress of this job
  15505. @param p The value of reduce progress to set to]]>
  15506. </doc>
  15507. </method>
  15508. <method name="setPriority"
  15509. abstract="false" native="false" synchronized="true"
  15510. static="false" final="false" visibility="protected"
  15511. deprecated="not deprecated">
  15512. <param name="jp" type="org.apache.hadoop.mapreduce.JobPriority"/>
  15513. <doc>
  15514. <![CDATA[Set the priority of the job, defaulting to NORMAL.
  15515. @param jp new job priority]]>
  15516. </doc>
  15517. </method>
  15518. <method name="setFinishTime"
  15519. abstract="false" native="false" synchronized="true"
  15520. static="false" final="false" visibility="protected"
  15521. deprecated="not deprecated">
  15522. <param name="finishTime" type="long"/>
  15523. <doc>
  15524. <![CDATA[Set the finish time of the job
  15525. @param finishTime The finishTime of the job]]>
  15526. </doc>
  15527. </method>
  15528. <method name="setHistoryFile"
  15529. abstract="false" native="false" synchronized="true"
  15530. static="false" final="false" visibility="protected"
  15531. deprecated="not deprecated">
  15532. <param name="historyFile" type="java.lang.String"/>
  15533. <doc>
  15534. <![CDATA[Set the job history file url for a completed job]]>
  15535. </doc>
  15536. </method>
  15537. <method name="setTrackingUrl"
  15538. abstract="false" native="false" synchronized="true"
  15539. static="false" final="false" visibility="protected"
  15540. deprecated="not deprecated">
  15541. <param name="trackingUrl" type="java.lang.String"/>
  15542. <doc>
  15543. <![CDATA[Set the link to the web-ui for details of the job.]]>
  15544. </doc>
  15545. </method>
  15546. <method name="setRetired"
  15547. abstract="false" native="false" synchronized="true"
  15548. static="false" final="false" visibility="protected"
  15549. deprecated="not deprecated">
  15550. <doc>
  15551. <![CDATA[Set the job retire flag to true.]]>
  15552. </doc>
  15553. </method>
  15554. <method name="setState"
  15555. abstract="false" native="false" synchronized="true"
  15556. static="false" final="false" visibility="protected"
  15557. deprecated="not deprecated">
  15558. <param name="state" type="org.apache.hadoop.mapreduce.JobStatus.State"/>
  15559. <doc>
  15560. <![CDATA[Change the current run state of the job.]]>
  15561. </doc>
  15562. </method>
  15563. <method name="setStartTime"
  15564. abstract="false" native="false" synchronized="true"
  15565. static="false" final="false" visibility="protected"
  15566. deprecated="not deprecated">
  15567. <param name="startTime" type="long"/>
  15568. <doc>
  15569. <![CDATA[Set the start time of the job
  15570. @param startTime The startTime of the job]]>
  15571. </doc>
  15572. </method>
  15573. <method name="setUsername"
  15574. abstract="false" native="false" synchronized="true"
  15575. static="false" final="false" visibility="protected"
  15576. deprecated="not deprecated">
  15577. <param name="userName" type="java.lang.String"/>
  15578. <doc>
  15579. <![CDATA[@param userName The username of the job]]>
  15580. </doc>
  15581. </method>
  15582. <method name="setSchedulingInfo"
  15583. abstract="false" native="false" synchronized="true"
  15584. static="false" final="false" visibility="protected"
  15585. deprecated="not deprecated">
  15586. <param name="schedulingInfo" type="java.lang.String"/>
  15587. <doc>
  15588. <![CDATA[Sets the scheduling information associated with a particular job.
  15589. @param schedulingInfo Scheduling information of the job]]>
  15590. </doc>
  15591. </method>
  15592. <method name="setJobACLs"
  15593. abstract="false" native="false" synchronized="true"
  15594. static="false" final="false" visibility="protected"
  15595. deprecated="not deprecated">
  15596. <param name="acls" type="java.util.Map"/>
  15597. <doc>
  15598. <![CDATA[Set the job acls.
  15599. @param acls {@link Map} from {@link JobACL} to {@link AccessControlList}]]>
  15600. </doc>
  15601. </method>
  15602. <method name="getMapProgress" return="float"
  15603. abstract="false" native="false" synchronized="true"
  15604. static="false" final="false" visibility="public"
  15605. deprecated="not deprecated">
  15606. <doc>
  15607. <![CDATA[@return Percentage of progress in maps]]>
  15608. </doc>
  15609. </method>
  15610. <method name="getCleanupProgress" return="float"
  15611. abstract="false" native="false" synchronized="true"
  15612. static="false" final="false" visibility="public"
  15613. deprecated="not deprecated">
  15614. <doc>
  15615. <![CDATA[@return Percentage of progress in cleanup]]>
  15616. </doc>
  15617. </method>
  15618. <method name="getSetupProgress" return="float"
  15619. abstract="false" native="false" synchronized="true"
  15620. static="false" final="false" visibility="public"
  15621. deprecated="not deprecated">
  15622. <doc>
  15623. <![CDATA[@return Percentage of progress in setup]]>
  15624. </doc>
  15625. </method>
  15626. <method name="getReduceProgress" return="float"
  15627. abstract="false" native="false" synchronized="true"
  15628. static="false" final="false" visibility="public"
  15629. deprecated="not deprecated">
  15630. <doc>
  15631. <![CDATA[@return Percentage of progress in reduce]]>
  15632. </doc>
  15633. </method>
  15634. <method name="getState" return="org.apache.hadoop.mapreduce.JobStatus.State"
  15635. abstract="false" native="false" synchronized="true"
  15636. static="false" final="false" visibility="public"
  15637. deprecated="not deprecated">
  15638. <doc>
  15639. <![CDATA[@return running state of the job]]>
  15640. </doc>
  15641. </method>
  15642. <method name="getStartTime" return="long"
  15643. abstract="false" native="false" synchronized="true"
  15644. static="false" final="false" visibility="public"
  15645. deprecated="not deprecated">
  15646. <doc>
  15647. <![CDATA[@return start time of the job]]>
  15648. </doc>
  15649. </method>
  15650. <method name="clone" return="java.lang.Object"
  15651. abstract="false" native="false" synchronized="false"
  15652. static="false" final="false" visibility="public"
  15653. deprecated="not deprecated">
  15654. </method>
  15655. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  15656. abstract="false" native="false" synchronized="false"
  15657. static="false" final="false" visibility="public"
  15658. deprecated="not deprecated">
  15659. <doc>
  15660. <![CDATA[@return The jobid of the Job]]>
  15661. </doc>
  15662. </method>
  15663. <method name="getUsername" return="java.lang.String"
  15664. abstract="false" native="false" synchronized="true"
  15665. static="false" final="false" visibility="public"
  15666. deprecated="not deprecated">
  15667. <doc>
  15668. <![CDATA[@return the username of the job]]>
  15669. </doc>
  15670. </method>
  15671. <method name="getSchedulingInfo" return="java.lang.String"
  15672. abstract="false" native="false" synchronized="true"
  15673. static="false" final="false" visibility="public"
  15674. deprecated="not deprecated">
  15675. <doc>
  15676. <![CDATA[Gets the scheduling information associated with a particular job.
  15677. @return the scheduling information of the job]]>
  15678. </doc>
  15679. </method>
  15680. <method name="getJobACLs" return="java.util.Map"
  15681. abstract="false" native="false" synchronized="true"
  15682. static="false" final="false" visibility="public"
  15683. deprecated="not deprecated">
  15684. <doc>
  15685. <![CDATA[Get the job acls.
  15686. @return a {@link Map} from {@link JobACL} to {@link AccessControlList}]]>
  15687. </doc>
  15688. </method>
  15689. <method name="getPriority" return="org.apache.hadoop.mapreduce.JobPriority"
  15690. abstract="false" native="false" synchronized="true"
  15691. static="false" final="false" visibility="public"
  15692. deprecated="not deprecated">
  15693. <doc>
  15694. <![CDATA[Return the priority of the job
  15695. @return job priority]]>
  15696. </doc>
  15697. </method>
  15698. <method name="isJobComplete" return="boolean"
  15699. abstract="false" native="false" synchronized="true"
  15700. static="false" final="false" visibility="public"
  15701. deprecated="not deprecated">
  15702. <doc>
  15703. <![CDATA[Returns true if the status is for a completed job.]]>
  15704. </doc>
  15705. </method>
  15706. <method name="write"
  15707. abstract="false" native="false" synchronized="true"
  15708. static="false" final="false" visibility="public"
  15709. deprecated="not deprecated">
  15710. <param name="out" type="java.io.DataOutput"/>
  15711. <exception name="IOException" type="java.io.IOException"/>
  15712. </method>
  15713. <method name="readFields"
  15714. abstract="false" native="false" synchronized="true"
  15715. static="false" final="false" visibility="public"
  15716. deprecated="not deprecated">
  15717. <param name="in" type="java.io.DataInput"/>
  15718. <exception name="IOException" type="java.io.IOException"/>
  15719. </method>
  15720. <method name="getJobName" return="java.lang.String"
  15721. abstract="false" native="false" synchronized="false"
  15722. static="false" final="false" visibility="public"
  15723. deprecated="not deprecated">
  15724. <doc>
  15725. <![CDATA[Get the user-specified job name.]]>
  15726. </doc>
  15727. </method>
  15728. <method name="getJobFile" return="java.lang.String"
  15729. abstract="false" native="false" synchronized="false"
  15730. static="false" final="false" visibility="public"
  15731. deprecated="not deprecated">
  15732. <doc>
  15733. <![CDATA[Get the configuration file for the job.]]>
  15734. </doc>
  15735. </method>
  15736. <method name="getTrackingUrl" return="java.lang.String"
  15737. abstract="false" native="false" synchronized="true"
  15738. static="false" final="false" visibility="public"
  15739. deprecated="not deprecated">
  15740. <doc>
  15741. <![CDATA[Get the link to the web-ui for details of the job.]]>
  15742. </doc>
  15743. </method>
  15744. <method name="getFinishTime" return="long"
  15745. abstract="false" native="false" synchronized="true"
  15746. static="false" final="false" visibility="public"
  15747. deprecated="not deprecated">
  15748. <doc>
  15749. <![CDATA[Get the finish time of the job.]]>
  15750. </doc>
  15751. </method>
  15752. <method name="isRetired" return="boolean"
  15753. abstract="false" native="false" synchronized="true"
  15754. static="false" final="false" visibility="public"
  15755. deprecated="not deprecated">
  15756. <doc>
  15757. <![CDATA[Check whether the job has retired.]]>
  15758. </doc>
  15759. </method>
  15760. <method name="getHistoryFile" return="java.lang.String"
  15761. abstract="false" native="false" synchronized="true"
  15762. static="false" final="false" visibility="public"
  15763. deprecated="not deprecated">
  15764. <doc>
  15765. <![CDATA[@return the job history file name for a completed job, or null if the job
  15766. is not completed or the history file is not available.]]>
  15767. </doc>
  15768. </method>
  15769. <method name="toString" return="java.lang.String"
  15770. abstract="false" native="false" synchronized="false"
  15771. static="false" final="false" visibility="public"
  15772. deprecated="not deprecated">
  15773. </method>
  15774. <doc>
  15775. <![CDATA[Describes the current status of a job.]]>
  15776. </doc>
  15777. </class>
  15778. <!-- end class org.apache.hadoop.mapreduce.JobStatus -->
  15779. <!-- start class org.apache.hadoop.mapreduce.JobStatus.State -->
  15780. <class name="JobStatus.State" extends="java.lang.Enum"
  15781. abstract="false"
  15782. static="true" final="true" visibility="public"
  15783. deprecated="not deprecated">
  15784. <method name="values" return="org.apache.hadoop.mapreduce.JobStatus.State[]"
  15785. abstract="false" native="false" synchronized="false"
  15786. static="true" final="false" visibility="public"
  15787. deprecated="not deprecated">
  15788. </method>
  15789. <method name="valueOf" return="org.apache.hadoop.mapreduce.JobStatus.State"
  15790. abstract="false" native="false" synchronized="false"
  15791. static="true" final="false" visibility="public"
  15792. deprecated="not deprecated">
  15793. <param name="name" type="java.lang.String"/>
  15794. </method>
  15795. <method name="getValue" return="int"
  15796. abstract="false" native="false" synchronized="false"
  15797. static="false" final="false" visibility="public"
  15798. deprecated="not deprecated">
  15799. </method>
  15800. <doc>
  15801. <![CDATA[Current state of the job]]>
  15802. </doc>
  15803. </class>
  15804. <!-- end class org.apache.hadoop.mapreduce.JobStatus.State -->
  15805. <!-- start interface org.apache.hadoop.mapreduce.MapContext -->
  15806. <interface name="MapContext" abstract="true"
  15807. static="false" final="false" visibility="public"
  15808. deprecated="not deprecated">
  15809. <implements name="org.apache.hadoop.mapreduce.TaskInputOutputContext"/>
  15810. <method name="getInputSplit" return="org.apache.hadoop.mapreduce.InputSplit"
  15811. abstract="false" native="false" synchronized="false"
  15812. static="false" final="false" visibility="public"
  15813. deprecated="not deprecated">
  15814. <doc>
  15815. <![CDATA[Get the input split for this map.]]>
  15816. </doc>
  15817. </method>
  15818. <doc>
  15819. <![CDATA[The context that is given to the {@link Mapper}.
  15820. @param <KEYIN> the key input type to the Mapper
  15821. @param <VALUEIN> the value input type to the Mapper
  15822. @param <KEYOUT> the key output type from the Mapper
  15823. @param <VALUEOUT> the value output type from the Mapper]]>
  15824. </doc>
  15825. </interface>
  15826. <!-- end interface org.apache.hadoop.mapreduce.MapContext -->
  15827. <!-- start class org.apache.hadoop.mapreduce.Mapper -->
  15828. <class name="Mapper" extends="java.lang.Object"
  15829. abstract="false"
  15830. static="false" final="false" visibility="public"
  15831. deprecated="not deprecated">
  15832. <constructor name="Mapper"
  15833. static="false" final="false" visibility="public"
  15834. deprecated="not deprecated">
  15835. </constructor>
  15836. <method name="setup"
  15837. abstract="false" native="false" synchronized="false"
  15838. static="false" final="false" visibility="protected"
  15839. deprecated="not deprecated">
  15840. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  15841. <exception name="IOException" type="java.io.IOException"/>
  15842. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  15843. <doc>
  15844. <![CDATA[Called once at the beginning of the task.]]>
  15845. </doc>
  15846. </method>
  15847. <method name="map"
  15848. abstract="false" native="false" synchronized="false"
  15849. static="false" final="false" visibility="protected"
  15850. deprecated="not deprecated">
  15851. <param name="key" type="KEYIN"/>
  15852. <param name="value" type="VALUEIN"/>
  15853. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  15854. <exception name="IOException" type="java.io.IOException"/>
  15855. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  15856. <doc>
  15857. <![CDATA[Called once for each key/value pair in the input split. Most applications
  15858. should override this, but the default is the identity function.]]>
  15859. </doc>
  15860. </method>
  15861. <method name="cleanup"
  15862. abstract="false" native="false" synchronized="false"
  15863. static="false" final="false" visibility="protected"
  15864. deprecated="not deprecated">
  15865. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  15866. <exception name="IOException" type="java.io.IOException"/>
  15867. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  15868. <doc>
  15869. <![CDATA[Called once at the end of the task.]]>
  15870. </doc>
  15871. </method>
  15872. <method name="run"
  15873. abstract="false" native="false" synchronized="false"
  15874. static="false" final="false" visibility="public"
  15875. deprecated="not deprecated">
  15876. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  15877. <exception name="IOException" type="java.io.IOException"/>
  15878. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  15879. <doc>
  15880. <![CDATA[Expert users can override this method for more complete control over the
  15881. execution of the Mapper.
  15882. @param context
  15883. @throws IOException]]>
  15884. </doc>
  15885. </method>
  15886. <doc>
  15887. <![CDATA[Maps input key/value pairs to a set of intermediate key/value pairs.
  15888. <p>Maps are the individual tasks which transform input records into
  15889. intermediate records. The transformed intermediate records need not be of
  15890. the same type as the input records. A given input pair may map to zero or
  15891. many output pairs.</p>
  15892. <p>The Hadoop Map-Reduce framework spawns one map task for each
  15893. {@link InputSplit} generated by the {@link InputFormat} for the job.
  15894. <code>Mapper</code> implementations can access the {@link Configuration} for
  15895. the job via {@link JobContext#getConfiguration()}.</p>
  15896. <p>The framework first calls
  15897. {@link #setup(org.apache.hadoop.mapreduce.Mapper.Context)}, followed by
  15898. {@link #map(Object, Object, Context)}
  15899. for each key/value pair in the <code>InputSplit</code>. Finally
  15900. {@link #cleanup(Context)} is called.</p>
  15901. <p>All intermediate values associated with a given output key are
  15902. subsequently grouped by the framework, and passed to a {@link Reducer} to
  15903. determine the final output. Users can control the sorting and grouping by
  15904. specifying two key {@link RawComparator} classes.</p>
  15905. <p>The <code>Mapper</code> outputs are partitioned per
  15906. <code>Reducer</code>. Users can control which keys (and hence records) go to
  15907. which <code>Reducer</code> by implementing a custom {@link Partitioner}.</p>
  15908. <p>Users can optionally specify a <code>combiner</code>, via
  15909. {@link Job#setCombinerClass(Class)}, to perform local aggregation of the
  15910. intermediate outputs, which helps to cut down the amount of data transferred
  15911. from the <code>Mapper</code> to the <code>Reducer</code>.</p>
  15912. <p>Applications can specify if and how the intermediate
  15913. outputs are to be compressed and which {@link CompressionCodec}s are to be
  15914. used via the <code>Configuration</code>.</p>
  15915. <p>If the job has zero
  15916. reduces then the output of the <code>Mapper</code> is directly written
  15917. to the {@link OutputFormat} without sorting by keys.</p>
  15918. <p>Example:</p>
  15919. <p><blockquote><pre>
  15920. public class TokenCounterMapper
  15921. extends Mapper&lt;Object, Text, Text, IntWritable&gt;{
  15922. private final static IntWritable one = new IntWritable(1);
  15923. private Text word = new Text();
  15924. public void map(Object key, Text value, Context context) throws IOException, InterruptedException {
  15925. StringTokenizer itr = new StringTokenizer(value.toString());
  15926. while (itr.hasMoreTokens()) {
  15927. word.set(itr.nextToken());
  15928. context.write(word, one);
  15929. }
  15930. }
  15931. }
  15932. </pre></blockquote></p>
  15933. <p>Applications may override the {@link #run(Context)} method to exert
  15934. greater control on map processing e.g. multi-threaded <code>Mapper</code>s
  15935. etc.</p>
  15936. @see InputFormat
  15937. @see JobContext
  15938. @see Partitioner
  15939. @see Reducer]]>
  15940. </doc>
  15941. </class>
  15942. <!-- end class org.apache.hadoop.mapreduce.Mapper -->
  15943. <!-- start class org.apache.hadoop.mapreduce.Mapper.Context -->
  15944. <class name="Mapper.Context" extends="java.lang.Object"
  15945. abstract="true"
  15946. static="false" final="false" visibility="public"
  15947. deprecated="not deprecated">
  15948. <implements name="org.apache.hadoop.mapreduce.MapContext"/>
  15949. <constructor name="Mapper.Context"
  15950. static="false" final="false" visibility="public"
  15951. deprecated="not deprecated">
  15952. </constructor>
  15953. <doc>
  15954. <![CDATA[The <code>Context</code> passed on to the {@link Mapper} implementations.]]>
  15955. </doc>
  15956. </class>
  15957. <!-- end class org.apache.hadoop.mapreduce.Mapper.Context -->
  15958. <!-- start class org.apache.hadoop.mapreduce.MarkableIterator -->
  15959. <class name="MarkableIterator" extends="java.lang.Object"
  15960. abstract="false"
  15961. static="false" final="false" visibility="public"
  15962. deprecated="not deprecated">
  15963. <implements name="org.apache.hadoop.mapreduce.MarkableIteratorInterface"/>
  15964. <constructor name="MarkableIterator" type="java.util.Iterator"
  15965. static="false" final="false" visibility="public"
  15966. deprecated="not deprecated">
  15967. <doc>
  15968. <![CDATA[Create a new iterator layered on the input iterator
  15969. @param itr underlying iterator that implements MarkableIteratorInterface]]>
  15970. </doc>
  15971. </constructor>
  15972. <method name="mark"
  15973. abstract="false" native="false" synchronized="false"
  15974. static="false" final="false" visibility="public"
  15975. deprecated="not deprecated">
  15976. <exception name="IOException" type="java.io.IOException"/>
  15977. </method>
  15978. <method name="reset"
  15979. abstract="false" native="false" synchronized="false"
  15980. static="false" final="false" visibility="public"
  15981. deprecated="not deprecated">
  15982. <exception name="IOException" type="java.io.IOException"/>
  15983. </method>
  15984. <method name="clearMark"
  15985. abstract="false" native="false" synchronized="false"
  15986. static="false" final="false" visibility="public"
  15987. deprecated="not deprecated">
  15988. <exception name="IOException" type="java.io.IOException"/>
  15989. </method>
  15990. <method name="hasNext" return="boolean"
  15991. abstract="false" native="false" synchronized="false"
  15992. static="false" final="false" visibility="public"
  15993. deprecated="not deprecated">
  15994. </method>
  15995. <method name="next" return="VALUE"
  15996. abstract="false" native="false" synchronized="false"
  15997. static="false" final="false" visibility="public"
  15998. deprecated="not deprecated">
  15999. </method>
  16000. <method name="remove"
  16001. abstract="false" native="false" synchronized="false"
  16002. static="false" final="false" visibility="public"
  16003. deprecated="not deprecated">
  16004. </method>
  16005. <doc>
  16006. <![CDATA[<code>MarkableIterator</code> is a wrapper iterator class that
  16007. implements the {@link MarkableIteratorInterface}.]]>
  16008. </doc>
  16009. </class>
  16010. <!-- end class org.apache.hadoop.mapreduce.MarkableIterator -->
  16011. <!-- start class org.apache.hadoop.mapreduce.OutputCommitter -->
  16012. <class name="OutputCommitter" extends="java.lang.Object"
  16013. abstract="true"
  16014. static="false" final="false" visibility="public"
  16015. deprecated="not deprecated">
  16016. <constructor name="OutputCommitter"
  16017. static="false" final="false" visibility="public"
  16018. deprecated="not deprecated">
  16019. </constructor>
  16020. <method name="setupJob"
  16021. abstract="true" native="false" synchronized="false"
  16022. static="false" final="false" visibility="public"
  16023. deprecated="not deprecated">
  16024. <param name="jobContext" type="org.apache.hadoop.mapreduce.JobContext"/>
  16025. <exception name="IOException" type="java.io.IOException"/>
  16026. <doc>
  16027. <![CDATA[For the framework to setup the job output during initialization
  16028. @param jobContext Context of the job whose output is being written.
  16029. @throws IOException if temporary output could not be created]]>
  16030. </doc>
  16031. </method>
  16032. <method name="cleanupJob"
  16033. abstract="false" native="false" synchronized="false"
  16034. static="false" final="false" visibility="public"
  16035. deprecated="Use {@link #commitJob(JobContext)} or
  16036. {@link #abortJob(JobContext, JobStatus.State)} instead.">
  16037. <param name="jobContext" type="org.apache.hadoop.mapreduce.JobContext"/>
  16038. <exception name="IOException" type="java.io.IOException"/>
  16039. <doc>
  16040. <![CDATA[For cleaning up the job's output after job completion
  16041. @param jobContext Context of the job whose output is being written.
  16042. @throws IOException
  16043. @deprecated Use {@link #commitJob(JobContext)} or
  16044. {@link #abortJob(JobContext, JobStatus.State)} instead.]]>
  16045. </doc>
  16046. </method>
  16047. <method name="commitJob"
  16048. abstract="false" native="false" synchronized="false"
  16049. static="false" final="false" visibility="public"
  16050. deprecated="not deprecated">
  16051. <param name="jobContext" type="org.apache.hadoop.mapreduce.JobContext"/>
  16052. <exception name="IOException" type="java.io.IOException"/>
  16053. <doc>
  16054. <![CDATA[For committing job's output after successful job completion. Note that this
  16055. is invoked for jobs with final runstate as SUCCESSFUL.
  16056. @param jobContext Context of the job whose output is being written.
  16057. @throws IOException]]>
  16058. </doc>
  16059. </method>
  16060. <method name="abortJob"
  16061. abstract="false" native="false" synchronized="false"
  16062. static="false" final="false" visibility="public"
  16063. deprecated="not deprecated">
  16064. <param name="jobContext" type="org.apache.hadoop.mapreduce.JobContext"/>
  16065. <param name="state" type="org.apache.hadoop.mapreduce.JobStatus.State"/>
  16066. <exception name="IOException" type="java.io.IOException"/>
  16067. <doc>
  16068. <![CDATA[For aborting an unsuccessful job's output. Note that this is invoked for
  16069. jobs with final runstate as {@link JobStatus.State#FAILED} or
  16070. {@link JobStatus.State#KILLED}.
  16071. @param jobContext Context of the job whose output is being written.
  16072. @param state final runstate of the job
  16073. @throws IOException]]>
  16074. </doc>
  16075. </method>
  16076. <method name="setupTask"
  16077. abstract="true" native="false" synchronized="false"
  16078. static="false" final="false" visibility="public"
  16079. deprecated="not deprecated">
  16080. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16081. <exception name="IOException" type="java.io.IOException"/>
  16082. <doc>
  16083. <![CDATA[Sets up output for the task.
  16084. @param taskContext Context of the task whose output is being written.
  16085. @throws IOException]]>
  16086. </doc>
  16087. </method>
  16088. <method name="needsTaskCommit" return="boolean"
  16089. abstract="true" native="false" synchronized="false"
  16090. static="false" final="false" visibility="public"
  16091. deprecated="not deprecated">
  16092. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16093. <exception name="IOException" type="java.io.IOException"/>
  16094. <doc>
  16095. <![CDATA[Check whether task needs a commit
  16096. @param taskContext
  16097. @return true if the task needs a commit, false otherwise
  16098. @throws IOException]]>
  16099. </doc>
  16100. </method>
  16101. <method name="commitTask"
  16102. abstract="true" native="false" synchronized="false"
  16103. static="false" final="false" visibility="public"
  16104. deprecated="not deprecated">
  16105. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16106. <exception name="IOException" type="java.io.IOException"/>
  16107. <doc>
  16108. <![CDATA[To promote the task's temporary output to final output location
  16109. The task's output is moved to the job's output directory.
  16110. @param taskContext Context of the task whose output is being written.
  16111. @throws IOException if commit is not successful]]>
  16112. </doc>
  16113. </method>
  16114. <method name="abortTask"
  16115. abstract="true" native="false" synchronized="false"
  16116. static="false" final="false" visibility="public"
  16117. deprecated="not deprecated">
  16118. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16119. <exception name="IOException" type="java.io.IOException"/>
  16120. <doc>
  16121. <![CDATA[Discard the task output
  16122. @param taskContext
  16123. @throws IOException]]>
  16124. </doc>
  16125. </method>
  16126. <doc>
  16127. <![CDATA[<code>OutputCommitter</code> describes the commit of task output for a
  16128. Map-Reduce job.
  16129. <p>The Map-Reduce framework relies on the <code>OutputCommitter</code> of
  16130. the job to:</p>
  16131. <ol>
  16132. <li>
  16133. Setup the job during initialization. For example, create the temporary
  16134. output directory for the job during the initialization of the job.
  16135. </li>
  16136. <li>
  16137. Cleanup the job after the job completion. For example, remove the
  16138. temporary output directory after the job completion.
  16139. </li>
  16140. <li>
  16141. Setup the task temporary output.
  16142. </li>
  16143. <li>
  16144. Check whether a task needs a commit. This is to avoid the commit
  16145. procedure if a task does not need commit.
  16146. </li>
  16147. <li>
  16148. Commit of the task output.
  16149. </li>
  16150. <li>
  16151. Discard the task commit.
  16152. </li>
  16153. </ol>
  16154. @see org.apache.hadoop.mapreduce.lib.output.FileOutputCommitter
  16155. @see JobContext
  16156. @see TaskAttemptContext]]>
  16157. </doc>
  16158. </class>
  16159. <!-- end class org.apache.hadoop.mapreduce.OutputCommitter -->
  16160. <!-- start class org.apache.hadoop.mapreduce.OutputFormat -->
  16161. <class name="OutputFormat" extends="java.lang.Object"
  16162. abstract="true"
  16163. static="false" final="false" visibility="public"
  16164. deprecated="not deprecated">
  16165. <constructor name="OutputFormat"
  16166. static="false" final="false" visibility="public"
  16167. deprecated="not deprecated">
  16168. </constructor>
  16169. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  16170. abstract="true" native="false" synchronized="false"
  16171. static="false" final="false" visibility="public"
  16172. deprecated="not deprecated">
  16173. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16174. <exception name="IOException" type="java.io.IOException"/>
  16175. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16176. <doc>
  16177. <![CDATA[Get the {@link RecordWriter} for the given task.
  16178. @param context the information about the current task.
  16179. @return a {@link RecordWriter} to write the output for the job.
  16180. @throws IOException]]>
  16181. </doc>
  16182. </method>
  16183. <method name="checkOutputSpecs"
  16184. abstract="true" native="false" synchronized="false"
  16185. static="false" final="false" visibility="public"
  16186. deprecated="not deprecated">
  16187. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  16188. <exception name="IOException" type="java.io.IOException"/>
  16189. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16190. <doc>
  16191. <![CDATA[Check for validity of the output-specification for the job.
  16192. <p>This is to validate the output specification for the job when the
  16193. job is submitted. Typically checks that it does not already exist,
  16194. throwing an exception when it already exists, so that output is not
  16195. overwritten.</p>
  16196. @param context information about the job
  16197. @throws IOException when output should not be attempted]]>
  16198. </doc>
  16199. </method>
  16200. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  16201. abstract="true" native="false" synchronized="false"
  16202. static="false" final="false" visibility="public"
  16203. deprecated="not deprecated">
  16204. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16205. <exception name="IOException" type="java.io.IOException"/>
  16206. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16207. <doc>
  16208. <![CDATA[Get the output committer for this output format. This is responsible
  16209. for ensuring the output is committed correctly.
  16210. @param context the task context
  16211. @return an output committer
  16212. @throws IOException
  16213. @throws InterruptedException]]>
  16214. </doc>
  16215. </method>
  16216. <doc>
  16217. <![CDATA[<code>OutputFormat</code> describes the output-specification for a
  16218. Map-Reduce job.
  16219. <p>The Map-Reduce framework relies on the <code>OutputFormat</code> of the
  16220. job to:</p>
  16221. <ol>
  16222. <li>
  16223. Validate the output-specification of the job. For example, check that the
  16224. output directory doesn't already exist.</li>
  16225. <li>
  16226. Provide the {@link RecordWriter} implementation to be used to write out
  16227. the output files of the job. Output files are stored in a
  16228. {@link FileSystem}.
  16229. </li>
  16230. </ol>
  16231. @see RecordWriter]]>
  16232. </doc>
  16233. </class>
  16234. <!-- end class org.apache.hadoop.mapreduce.OutputFormat -->
  16235. <!-- start class org.apache.hadoop.mapreduce.Partitioner -->
  16236. <class name="Partitioner" extends="java.lang.Object"
  16237. abstract="true"
  16238. static="false" final="false" visibility="public"
  16239. deprecated="not deprecated">
  16240. <constructor name="Partitioner"
  16241. static="false" final="false" visibility="public"
  16242. deprecated="not deprecated">
  16243. </constructor>
  16244. <method name="getPartition" return="int"
  16245. abstract="true" native="false" synchronized="false"
  16246. static="false" final="false" visibility="public"
  16247. deprecated="not deprecated">
  16248. <param name="key" type="KEY"/>
  16249. <param name="value" type="VALUE"/>
  16250. <param name="numPartitions" type="int"/>
  16251. <doc>
  16252. <![CDATA[Get the partition number for a given key (hence record) given the total
  16253. number of partitions i.e. number of reduce-tasks for the job.
  16254. <p>Typically a hash function on all or a subset of the key.</p>
  16255. @param key the key to be partitioned.
  16256. @param value the entry value.
  16257. @param numPartitions the total number of partitions.
  16258. @return the partition number for the <code>key</code>.]]>
  16259. </doc>
  16260. </method>
  16261. <doc>
  16262. <![CDATA[Partitions the key space.
  16263. <p><code>Partitioner</code> controls the partitioning of the keys of the
  16264. intermediate map-outputs. The key (or a subset of the key) is used to derive
  16265. the partition, typically by a hash function. The total number of partitions
  16266. is the same as the number of reduce tasks for the job. Hence this controls
  16267. which of the <code>m</code> reduce tasks the intermediate key (and hence the
  16268. record) is sent for reduction.</p>
  16269. @see Reducer]]>
  16270. </doc>
  16271. </class>
  16272. <!-- end class org.apache.hadoop.mapreduce.Partitioner -->
  16273. <!-- start class org.apache.hadoop.mapreduce.QueueAclsInfo -->
  16274. <class name="QueueAclsInfo" extends="java.lang.Object"
  16275. abstract="false"
  16276. static="false" final="false" visibility="public"
  16277. deprecated="not deprecated">
  16278. <implements name="org.apache.hadoop.io.Writable"/>
  16279. <constructor name="QueueAclsInfo"
  16280. static="false" final="false" visibility="public"
  16281. deprecated="not deprecated">
  16282. <doc>
  16283. <![CDATA[Default constructor for QueueAclsInfo.]]>
  16284. </doc>
  16285. </constructor>
  16286. <constructor name="QueueAclsInfo" type="java.lang.String, java.lang.String[]"
  16287. static="false" final="false" visibility="public"
  16288. deprecated="not deprecated">
  16289. <doc>
  16290. <![CDATA[Construct a new QueueAclsInfo object using the queue name and the
  16291. queue operations array
  16292. @param queueName Name of the job queue
  16293. @param operations]]>
  16294. </doc>
  16295. </constructor>
  16296. <method name="getQueueName" return="java.lang.String"
  16297. abstract="false" native="false" synchronized="false"
  16298. static="false" final="false" visibility="public"
  16299. deprecated="not deprecated">
  16300. <doc>
  16301. <![CDATA[Get queue name.
  16302. @return name]]>
  16303. </doc>
  16304. </method>
  16305. <method name="setQueueName"
  16306. abstract="false" native="false" synchronized="false"
  16307. static="false" final="false" visibility="protected"
  16308. deprecated="not deprecated">
  16309. <param name="queueName" type="java.lang.String"/>
  16310. </method>
  16311. <method name="getOperations" return="java.lang.String[]"
  16312. abstract="false" native="false" synchronized="false"
  16313. static="false" final="false" visibility="public"
  16314. deprecated="not deprecated">
  16315. <doc>
  16316. <![CDATA[Get operations allowed on queue.
  16317. @return array of String]]>
  16318. </doc>
  16319. </method>
  16320. <method name="readFields"
  16321. abstract="false" native="false" synchronized="false"
  16322. static="false" final="false" visibility="public"
  16323. deprecated="not deprecated">
  16324. <param name="in" type="java.io.DataInput"/>
  16325. <exception name="IOException" type="java.io.IOException"/>
  16326. </method>
  16327. <method name="write"
  16328. abstract="false" native="false" synchronized="false"
  16329. static="false" final="false" visibility="public"
  16330. deprecated="not deprecated">
  16331. <param name="out" type="java.io.DataOutput"/>
  16332. <exception name="IOException" type="java.io.IOException"/>
  16333. </method>
  16334. <doc>
  16335. <![CDATA[Class to encapsulate Queue ACLs for a particular
  16336. user.]]>
  16337. </doc>
  16338. </class>
  16339. <!-- end class org.apache.hadoop.mapreduce.QueueAclsInfo -->
  16340. <!-- start class org.apache.hadoop.mapreduce.QueueInfo -->
  16341. <class name="QueueInfo" extends="java.lang.Object"
  16342. abstract="false"
  16343. static="false" final="false" visibility="public"
  16344. deprecated="not deprecated">
  16345. <implements name="org.apache.hadoop.io.Writable"/>
  16346. <constructor name="QueueInfo"
  16347. static="false" final="false" visibility="public"
  16348. deprecated="not deprecated">
  16349. <doc>
  16350. <![CDATA[Default constructor for QueueInfo.]]>
  16351. </doc>
  16352. </constructor>
  16353. <constructor name="QueueInfo" type="java.lang.String, java.lang.String"
  16354. static="false" final="false" visibility="public"
  16355. deprecated="not deprecated">
  16356. <doc>
  16357. <![CDATA[Construct a new QueueInfo object using the queue name and the
  16358. scheduling information passed.
  16359. @param queueName Name of the job queue
  16360. @param schedulingInfo Scheduling Information associated with the job
  16361. queue]]>
  16362. </doc>
  16363. </constructor>
  16364. <constructor name="QueueInfo" type="java.lang.String, java.lang.String, org.apache.hadoop.mapreduce.QueueState, org.apache.hadoop.mapreduce.JobStatus[]"
  16365. static="false" final="false" visibility="public"
  16366. deprecated="not deprecated">
  16367. <doc>
  16368. <![CDATA[@param queueName
  16369. @param schedulingInfo
  16370. @param state
  16371. @param stats]]>
  16372. </doc>
  16373. </constructor>
  16374. <method name="setQueueName"
  16375. abstract="false" native="false" synchronized="false"
  16376. static="false" final="false" visibility="protected"
  16377. deprecated="not deprecated">
  16378. <param name="queueName" type="java.lang.String"/>
  16379. <doc>
  16380. <![CDATA[Set the queue name of the JobQueueInfo
  16381. @param queueName Name of the job queue.]]>
  16382. </doc>
  16383. </method>
  16384. <method name="getQueueName" return="java.lang.String"
  16385. abstract="false" native="false" synchronized="false"
  16386. static="false" final="false" visibility="public"
  16387. deprecated="not deprecated">
  16388. <doc>
  16389. <![CDATA[Get the queue name from JobQueueInfo
  16390. @return queue name]]>
  16391. </doc>
  16392. </method>
  16393. <method name="setSchedulingInfo"
  16394. abstract="false" native="false" synchronized="false"
  16395. static="false" final="false" visibility="protected"
  16396. deprecated="not deprecated">
  16397. <param name="schedulingInfo" type="java.lang.String"/>
  16398. <doc>
  16399. <![CDATA[Set the scheduling information associated with a particular job queue
  16400. @param schedulingInfo]]>
  16401. </doc>
  16402. </method>
  16403. <method name="getSchedulingInfo" return="java.lang.String"
  16404. abstract="false" native="false" synchronized="false"
  16405. static="false" final="false" visibility="public"
  16406. deprecated="not deprecated">
  16407. <doc>
  16408. <![CDATA[Gets the scheduling information associated with a particular job queue.
  16409. If nothing is set, returns <b>"N/A"</b>
  16410. @return Scheduling information associated to particular Job Queue]]>
  16411. </doc>
  16412. </method>
  16413. <method name="setState"
  16414. abstract="false" native="false" synchronized="false"
  16415. static="false" final="false" visibility="protected"
  16416. deprecated="not deprecated">
  16417. <param name="state" type="org.apache.hadoop.mapreduce.QueueState"/>
  16418. <doc>
  16419. <![CDATA[Set the state of the queue
  16420. @param state state of the queue.]]>
  16421. </doc>
  16422. </method>
  16423. <method name="getState" return="org.apache.hadoop.mapreduce.QueueState"
  16424. abstract="false" native="false" synchronized="false"
  16425. static="false" final="false" visibility="public"
  16426. deprecated="not deprecated">
  16427. <doc>
  16428. <![CDATA[Return the queue state
  16429. @return the queue state.]]>
  16430. </doc>
  16431. </method>
  16432. <method name="setJobStatuses"
  16433. abstract="false" native="false" synchronized="false"
  16434. static="false" final="false" visibility="protected"
  16435. deprecated="not deprecated">
  16436. <param name="stats" type="org.apache.hadoop.mapreduce.JobStatus[]"/>
  16437. </method>
  16438. <method name="getQueueChildren" return="java.util.List"
  16439. abstract="false" native="false" synchronized="false"
  16440. static="false" final="false" visibility="public"
  16441. deprecated="not deprecated">
  16442. <doc>
  16443. <![CDATA[Get immediate children.
  16444. @return list of QueueInfo]]>
  16445. </doc>
  16446. </method>
  16447. <method name="setQueueChildren"
  16448. abstract="false" native="false" synchronized="false"
  16449. static="false" final="false" visibility="protected"
  16450. deprecated="not deprecated">
  16451. <param name="children" type="java.util.List"/>
  16452. </method>
  16453. <method name="getProperties" return="java.util.Properties"
  16454. abstract="false" native="false" synchronized="false"
  16455. static="false" final="false" visibility="public"
  16456. deprecated="not deprecated">
  16457. <doc>
  16458. <![CDATA[Get properties.
  16459. @return Properties]]>
  16460. </doc>
  16461. </method>
  16462. <method name="setProperties"
  16463. abstract="false" native="false" synchronized="false"
  16464. static="false" final="false" visibility="protected"
  16465. deprecated="not deprecated">
  16466. <param name="props" type="java.util.Properties"/>
  16467. </method>
  16468. <method name="getJobStatuses" return="org.apache.hadoop.mapreduce.JobStatus[]"
  16469. abstract="false" native="false" synchronized="false"
  16470. static="false" final="false" visibility="public"
  16471. deprecated="not deprecated">
  16472. <doc>
  16473. <![CDATA[Get the jobs submitted to queue
  16474. @return list of JobStatus for the submitted jobs]]>
  16475. </doc>
  16476. </method>
  16477. <method name="readFields"
  16478. abstract="false" native="false" synchronized="false"
  16479. static="false" final="false" visibility="public"
  16480. deprecated="not deprecated">
  16481. <param name="in" type="java.io.DataInput"/>
  16482. <exception name="IOException" type="java.io.IOException"/>
  16483. </method>
  16484. <method name="write"
  16485. abstract="false" native="false" synchronized="false"
  16486. static="false" final="false" visibility="public"
  16487. deprecated="not deprecated">
  16488. <param name="out" type="java.io.DataOutput"/>
  16489. <exception name="IOException" type="java.io.IOException"/>
  16490. </method>
  16491. <doc>
  16492. <![CDATA[Class that contains the information regarding the Job Queues which are
  16493. maintained by the Hadoop Map/Reduce framework.]]>
  16494. </doc>
  16495. </class>
  16496. <!-- end class org.apache.hadoop.mapreduce.QueueInfo -->
  16497. <!-- start class org.apache.hadoop.mapreduce.QueueState -->
  16498. <class name="QueueState" extends="java.lang.Enum"
  16499. abstract="false"
  16500. static="false" final="true" visibility="public"
  16501. deprecated="not deprecated">
  16502. <method name="values" return="org.apache.hadoop.mapreduce.QueueState[]"
  16503. abstract="false" native="false" synchronized="false"
  16504. static="true" final="false" visibility="public"
  16505. deprecated="not deprecated">
  16506. </method>
  16507. <method name="valueOf" return="org.apache.hadoop.mapreduce.QueueState"
  16508. abstract="false" native="false" synchronized="false"
  16509. static="true" final="false" visibility="public"
  16510. deprecated="not deprecated">
  16511. <param name="name" type="java.lang.String"/>
  16512. </method>
  16513. <method name="getStateName" return="java.lang.String"
  16514. abstract="false" native="false" synchronized="false"
  16515. static="false" final="false" visibility="public"
  16516. deprecated="not deprecated">
  16517. <doc>
  16518. <![CDATA[@return the stateName]]>
  16519. </doc>
  16520. </method>
  16521. <method name="getState" return="org.apache.hadoop.mapreduce.QueueState"
  16522. abstract="false" native="false" synchronized="false"
  16523. static="true" final="false" visibility="public"
  16524. deprecated="not deprecated">
  16525. <param name="state" type="java.lang.String"/>
  16526. </method>
  16527. <method name="toString" return="java.lang.String"
  16528. abstract="false" native="false" synchronized="false"
  16529. static="false" final="false" visibility="public"
  16530. deprecated="not deprecated">
  16531. </method>
  16532. <doc>
  16533. <![CDATA[Enum representing queue state]]>
  16534. </doc>
  16535. </class>
  16536. <!-- end class org.apache.hadoop.mapreduce.QueueState -->
  16537. <!-- start class org.apache.hadoop.mapreduce.RecordReader -->
  16538. <class name="RecordReader" extends="java.lang.Object"
  16539. abstract="true"
  16540. static="false" final="false" visibility="public"
  16541. deprecated="not deprecated">
  16542. <implements name="java.io.Closeable"/>
  16543. <constructor name="RecordReader"
  16544. static="false" final="false" visibility="public"
  16545. deprecated="not deprecated">
  16546. </constructor>
  16547. <method name="initialize"
  16548. abstract="true" native="false" synchronized="false"
  16549. static="false" final="false" visibility="public"
  16550. deprecated="not deprecated">
  16551. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  16552. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16553. <exception name="IOException" type="java.io.IOException"/>
  16554. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16555. <doc>
  16556. <![CDATA[Called once at initialization.
  16557. @param split the split that defines the range of records to read
  16558. @param context the information about the task
  16559. @throws IOException
  16560. @throws InterruptedException]]>
  16561. </doc>
  16562. </method>
  16563. <method name="nextKeyValue" return="boolean"
  16564. abstract="true" native="false" synchronized="false"
  16565. static="false" final="false" visibility="public"
  16566. deprecated="not deprecated">
  16567. <exception name="IOException" type="java.io.IOException"/>
  16568. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16569. <doc>
  16570. <![CDATA[Read the next key, value pair.
  16571. @return true if a key/value pair was read
  16572. @throws IOException
  16573. @throws InterruptedException]]>
  16574. </doc>
  16575. </method>
  16576. <method name="getCurrentKey" return="KEYIN"
  16577. abstract="true" native="false" synchronized="false"
  16578. static="false" final="false" visibility="public"
  16579. deprecated="not deprecated">
  16580. <exception name="IOException" type="java.io.IOException"/>
  16581. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16582. <doc>
  16583. <![CDATA[Get the current key
  16584. @return the current key or null if there is no current key
  16585. @throws IOException
  16586. @throws InterruptedException]]>
  16587. </doc>
  16588. </method>
  16589. <method name="getCurrentValue" return="VALUEIN"
  16590. abstract="true" native="false" synchronized="false"
  16591. static="false" final="false" visibility="public"
  16592. deprecated="not deprecated">
  16593. <exception name="IOException" type="java.io.IOException"/>
  16594. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16595. <doc>
  16596. <![CDATA[Get the current value.
  16597. @return the object that was read
  16598. @throws IOException
  16599. @throws InterruptedException]]>
  16600. </doc>
  16601. </method>
  16602. <method name="getProgress" return="float"
  16603. abstract="true" native="false" synchronized="false"
  16604. static="false" final="false" visibility="public"
  16605. deprecated="not deprecated">
  16606. <exception name="IOException" type="java.io.IOException"/>
  16607. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16608. <doc>
  16609. <![CDATA[The current progress of the record reader through its data.
  16610. @return a number between 0.0 and 1.0 that is the fraction of the data read
  16611. @throws IOException
  16612. @throws InterruptedException]]>
  16613. </doc>
  16614. </method>
  16615. <method name="close"
  16616. abstract="true" native="false" synchronized="false"
  16617. static="false" final="false" visibility="public"
  16618. deprecated="not deprecated">
  16619. <exception name="IOException" type="java.io.IOException"/>
  16620. <doc>
  16621. <![CDATA[Close the record reader.]]>
  16622. </doc>
  16623. </method>
  16624. <doc>
  16625. <![CDATA[The record reader breaks the data into key/value pairs for input to the
  16626. {@link Mapper}.
  16627. @param <KEYIN>
  16628. @param <VALUEIN>]]>
  16629. </doc>
  16630. </class>
  16631. <!-- end class org.apache.hadoop.mapreduce.RecordReader -->
  16632. <!-- start class org.apache.hadoop.mapreduce.RecordWriter -->
  16633. <class name="RecordWriter" extends="java.lang.Object"
  16634. abstract="true"
  16635. static="false" final="false" visibility="public"
  16636. deprecated="not deprecated">
  16637. <constructor name="RecordWriter"
  16638. static="false" final="false" visibility="public"
  16639. deprecated="not deprecated">
  16640. </constructor>
  16641. <method name="write"
  16642. abstract="true" native="false" synchronized="false"
  16643. static="false" final="false" visibility="public"
  16644. deprecated="not deprecated">
  16645. <param name="key" type="K"/>
  16646. <param name="value" type="V"/>
  16647. <exception name="IOException" type="java.io.IOException"/>
  16648. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16649. <doc>
  16650. <![CDATA[Writes a key/value pair.
  16651. @param key the key to write.
  16652. @param value the value to write.
  16653. @throws IOException]]>
  16654. </doc>
  16655. </method>
  16656. <method name="close"
  16657. abstract="true" native="false" synchronized="false"
  16658. static="false" final="false" visibility="public"
  16659. deprecated="not deprecated">
  16660. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  16661. <exception name="IOException" type="java.io.IOException"/>
  16662. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16663. <doc>
  16664. <![CDATA[Close this <code>RecordWriter</code> to future operations.
  16665. @param context the context of the task
  16666. @throws IOException]]>
  16667. </doc>
  16668. </method>
  16669. <doc>
  16670. <![CDATA[<code>RecordWriter</code> writes the output &lt;key, value&gt; pairs
  16671. to an output file.
  16672. <p><code>RecordWriter</code> implementations write the job outputs to the
  16673. {@link FileSystem}.
  16674. @see OutputFormat]]>
  16675. </doc>
  16676. </class>
  16677. <!-- end class org.apache.hadoop.mapreduce.RecordWriter -->
  16678. <!-- start interface org.apache.hadoop.mapreduce.ReduceContext -->
  16679. <interface name="ReduceContext" abstract="true"
  16680. static="false" final="false" visibility="public"
  16681. deprecated="not deprecated">
  16682. <implements name="org.apache.hadoop.mapreduce.TaskInputOutputContext"/>
  16683. <method name="nextKey" return="boolean"
  16684. abstract="false" native="false" synchronized="false"
  16685. static="false" final="false" visibility="public"
  16686. deprecated="not deprecated">
  16687. <exception name="IOException" type="java.io.IOException"/>
  16688. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16689. <doc>
  16690. <![CDATA[Start processing next unique key.]]>
  16691. </doc>
  16692. </method>
  16693. <method name="getValues" return="java.lang.Iterable"
  16694. abstract="false" native="false" synchronized="false"
  16695. static="false" final="false" visibility="public"
  16696. deprecated="not deprecated">
  16697. <exception name="IOException" type="java.io.IOException"/>
  16698. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16699. <doc>
  16700. <![CDATA[Iterate through the values for the current key, reusing the same value
  16701. object, which is stored in the context.
  16702. @return the series of values associated with the current key. All of the
  16703. objects returned directly and indirectly from this method are reused.]]>
  16704. </doc>
  16705. </method>
  16706. <doc>
  16707. <![CDATA[The context passed to the {@link Reducer}.
  16708. @param <KEYIN> the class of the input keys
  16709. @param <VALUEIN> the class of the input values
  16710. @param <KEYOUT> the class of the output keys
  16711. @param <VALUEOUT> the class of the output values]]>
  16712. </doc>
  16713. </interface>
  16714. <!-- end interface org.apache.hadoop.mapreduce.ReduceContext -->
  16715. <!-- start interface org.apache.hadoop.mapreduce.ReduceContext.ValueIterator -->
  16716. <interface name="ReduceContext.ValueIterator" abstract="true"
  16717. static="true" final="false" visibility="public"
  16718. deprecated="not deprecated">
  16719. <implements name="org.apache.hadoop.mapreduce.MarkableIteratorInterface"/>
  16720. <method name="resetBackupStore"
  16721. abstract="false" native="false" synchronized="false"
  16722. static="false" final="false" visibility="public"
  16723. deprecated="not deprecated">
  16724. <exception name="IOException" type="java.io.IOException"/>
  16725. <doc>
  16726. <![CDATA[This method is called when the reducer moves from one key to
  16727. another.
  16728. @throws IOException]]>
  16729. </doc>
  16730. </method>
  16731. <doc>
  16732. <![CDATA[{@link Iterator} to iterate over values for a given group of records.]]>
  16733. </doc>
  16734. </interface>
  16735. <!-- end interface org.apache.hadoop.mapreduce.ReduceContext.ValueIterator -->
  16736. <!-- start class org.apache.hadoop.mapreduce.Reducer -->
  16737. <class name="Reducer" extends="java.lang.Object"
  16738. abstract="false"
  16739. static="false" final="false" visibility="public"
  16740. deprecated="not deprecated">
  16741. <constructor name="Reducer"
  16742. static="false" final="false" visibility="public"
  16743. deprecated="not deprecated">
  16744. </constructor>
  16745. <method name="setup"
  16746. abstract="false" native="false" synchronized="false"
  16747. static="false" final="false" visibility="protected"
  16748. deprecated="not deprecated">
  16749. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  16750. <exception name="IOException" type="java.io.IOException"/>
  16751. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16752. <doc>
  16753. <![CDATA[Called once at the start of the task.]]>
  16754. </doc>
  16755. </method>
  16756. <method name="reduce"
  16757. abstract="false" native="false" synchronized="false"
  16758. static="false" final="false" visibility="protected"
  16759. deprecated="not deprecated">
  16760. <param name="key" type="KEYIN"/>
  16761. <param name="values" type="java.lang.Iterable"/>
  16762. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  16763. <exception name="IOException" type="java.io.IOException"/>
  16764. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16765. <doc>
  16766. <![CDATA[This method is called once for each key. Most applications will define
  16767. their reduce class by overriding this method. The default implementation
  16768. is an identity function.]]>
  16769. </doc>
  16770. </method>
  16771. <method name="cleanup"
  16772. abstract="false" native="false" synchronized="false"
  16773. static="false" final="false" visibility="protected"
  16774. deprecated="not deprecated">
  16775. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  16776. <exception name="IOException" type="java.io.IOException"/>
  16777. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16778. <doc>
  16779. <![CDATA[Called once at the end of the task.]]>
  16780. </doc>
  16781. </method>
  16782. <method name="run"
  16783. abstract="false" native="false" synchronized="false"
  16784. static="false" final="false" visibility="public"
  16785. deprecated="not deprecated">
  16786. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  16787. <exception name="IOException" type="java.io.IOException"/>
  16788. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  16789. <doc>
  16790. <![CDATA[Advanced application writers can use the
  16791. {@link #run(org.apache.hadoop.mapreduce.Reducer.Context)} method to
  16792. control how the reduce task works.]]>
  16793. </doc>
  16794. </method>
  16795. <doc>
  16796. <![CDATA[Reduces a set of intermediate values which share a key to a smaller set of
  16797. values.
  16798. <p><code>Reducer</code> implementations
  16799. can access the {@link Configuration} for the job via the
  16800. {@link JobContext#getConfiguration()} method.</p>
  16801. <p><code>Reducer</code> has 3 primary phases:</p>
  16802. <ol>
  16803. <li>
  16804. <h4 id="Shuffle">Shuffle</h4>
  16805. <p>The <code>Reducer</code> copies the sorted output from each
  16806. {@link Mapper} using HTTP across the network.</p>
  16807. </li>
  16808. <li>
  16809. <h4 id="Sort">Sort</h4>
  16810. <p>The framework merge sorts <code>Reducer</code> inputs by
  16811. <code>key</code>s
  16812. (since different <code>Mapper</code>s may have output the same key).</p>
  16813. <p>The shuffle and sort phases occur simultaneously i.e. while outputs are
  16814. being fetched they are merged.</p>
  16815. <h5 id="SecondarySort">SecondarySort</h5>
  16816. <p>To achieve a secondary sort on the values returned by the value
  16817. iterator, the application should extend the key with the secondary
  16818. key and define a grouping comparator. The keys will be sorted using the
  16819. entire key, but will be grouped using the grouping comparator to decide
  16820. which keys and values are sent in the same call to reduce. The grouping
  16821. comparator is specified via
  16822. {@link Job#setGroupingComparatorClass(Class)}. The sort order is
  16823. controlled by
  16824. {@link Job#setSortComparatorClass(Class)}.</p>
  16825. For example, say that you want to find duplicate web pages and tag them
  16826. all with the url of the "best" known example. You would set up the job
  16827. like:
  16828. <ul>
  16829. <li>Map Input Key: url</li>
  16830. <li>Map Input Value: document</li>
  16831. <li>Map Output Key: document checksum, url pagerank</li>
  16832. <li>Map Output Value: url</li>
  16833. <li>Partitioner: by checksum</li>
  16834. <li>OutputKeyComparator: by checksum and then decreasing pagerank</li>
  16835. <li>OutputValueGroupingComparator: by checksum</li>
  16836. </ul>
  16837. </li>
  16838. <li>
  16839. <h4 id="Reduce">Reduce</h4>
  16840. <p>In this phase the
  16841. {@link #reduce(Object, Iterable, Context)}
  16842. method is called for each <code>&lt;key, (collection of values)&gt;</code> in
  16843. the sorted inputs.</p>
  16844. <p>The output of the reduce task is typically written to a
  16845. {@link RecordWriter} via
  16846. {@link Context#write(Object, Object)}.</p>
  16847. </li>
  16848. </ol>
  16849. <p>The output of the <code>Reducer</code> is <b>not re-sorted</b>.</p>
  16850. <p>Example:</p>
  16851. <p><blockquote><pre>
  16852. public class IntSumReducer&lt;Key&gt; extends Reducer&lt;Key,IntWritable,
  16853. Key,IntWritable&gt; {
  16854. private IntWritable result = new IntWritable();
  16855. public void reduce(Key key, Iterable&lt;IntWritable&gt; values,
  16856. Context context) throws IOException, InterruptedException {
  16857. int sum = 0;
  16858. for (IntWritable val : values) {
  16859. sum += val.get();
  16860. }
  16861. result.set(sum);
  16862. context.write(key, result);
  16863. }
  16864. }
  16865. </pre></blockquote></p>
  16866. @see Mapper
  16867. @see Partitioner]]>
  16868. </doc>
  16869. </class>
  16870. <!-- end class org.apache.hadoop.mapreduce.Reducer -->
  16871. <!-- start class org.apache.hadoop.mapreduce.Reducer.Context -->
  16872. <class name="Reducer.Context" extends="java.lang.Object"
  16873. abstract="true"
  16874. static="false" final="false" visibility="public"
  16875. deprecated="not deprecated">
  16876. <implements name="org.apache.hadoop.mapreduce.ReduceContext"/>
  16877. <constructor name="Reducer.Context"
  16878. static="false" final="false" visibility="public"
  16879. deprecated="not deprecated">
  16880. </constructor>
  16881. <doc>
  16882. <![CDATA[The <code>Context</code> passed on to the {@link Reducer} implementations.]]>
  16883. </doc>
  16884. </class>
  16885. <!-- end class org.apache.hadoop.mapreduce.Reducer.Context -->
  16886. <!-- start interface org.apache.hadoop.mapreduce.TaskAttemptContext -->
  16887. <interface name="TaskAttemptContext" abstract="true"
  16888. static="false" final="false" visibility="public"
  16889. deprecated="not deprecated">
  16890. <implements name="org.apache.hadoop.mapreduce.JobContext"/>
  16891. <implements name="org.apache.hadoop.util.Progressable"/>
  16892. <method name="getTaskAttemptID" return="org.apache.hadoop.mapreduce.TaskAttemptID"
  16893. abstract="false" native="false" synchronized="false"
  16894. static="false" final="false" visibility="public"
  16895. deprecated="not deprecated">
  16896. <doc>
  16897. <![CDATA[Get the unique name for this task attempt.]]>
  16898. </doc>
  16899. </method>
  16900. <method name="setStatus"
  16901. abstract="false" native="false" synchronized="false"
  16902. static="false" final="false" visibility="public"
  16903. deprecated="not deprecated">
  16904. <param name="msg" type="java.lang.String"/>
  16905. <doc>
  16906. <![CDATA[Set the current status of the task to the given string.]]>
  16907. </doc>
  16908. </method>
  16909. <method name="getStatus" return="java.lang.String"
  16910. abstract="false" native="false" synchronized="false"
  16911. static="false" final="false" visibility="public"
  16912. deprecated="not deprecated">
  16913. <doc>
  16914. <![CDATA[Get the last set status message.
  16915. @return the current status message]]>
  16916. </doc>
  16917. </method>
  16918. <method name="getCounter" return="org.apache.hadoop.mapreduce.Counter"
  16919. abstract="false" native="false" synchronized="false"
  16920. static="false" final="false" visibility="public"
  16921. deprecated="not deprecated">
  16922. <param name="counterName" type="java.lang.Enum"/>
  16923. <doc>
  16924. <![CDATA[Get the {@link Counter} for the given <code>counterName</code>.
  16925. @param counterName counter name
  16926. @return the <code>Counter</code> for the given <code>counterName</code>]]>
  16927. </doc>
  16928. </method>
  16929. <method name="getCounter" return="org.apache.hadoop.mapreduce.Counter"
  16930. abstract="false" native="false" synchronized="false"
  16931. static="false" final="false" visibility="public"
  16932. deprecated="not deprecated">
  16933. <param name="groupName" type="java.lang.String"/>
  16934. <param name="counterName" type="java.lang.String"/>
  16935. <doc>
  16936. <![CDATA[Get the {@link Counter} for the given <code>groupName</code> and
  16937. <code>counterName</code>.
  16938. @param counterName counter name
  16939. @return the <code>Counter</code> for the given <code>groupName</code> and
  16940. <code>counterName</code>]]>
  16941. </doc>
  16942. </method>
  16943. <doc>
  16944. <![CDATA[The context for task attempts.]]>
  16945. </doc>
  16946. </interface>
  16947. <!-- end interface org.apache.hadoop.mapreduce.TaskAttemptContext -->
  16948. <!-- start class org.apache.hadoop.mapreduce.TaskAttemptID -->
  16949. <class name="TaskAttemptID" extends="org.apache.hadoop.mapred.ID"
  16950. abstract="false"
  16951. static="false" final="false" visibility="public"
  16952. deprecated="not deprecated">
  16953. <constructor name="TaskAttemptID" type="org.apache.hadoop.mapreduce.TaskID, int"
  16954. static="false" final="false" visibility="public"
  16955. deprecated="not deprecated">
  16956. <doc>
  16957. <![CDATA[Constructs a TaskAttemptID object from given {@link TaskID}.
  16958. @param taskId TaskID that this task belongs to
  16959. @param id the task attempt number]]>
  16960. </doc>
  16961. </constructor>
  16962. <constructor name="TaskAttemptID" type="java.lang.String, int, org.apache.hadoop.mapreduce.TaskType, int, int"
  16963. static="false" final="false" visibility="public"
  16964. deprecated="not deprecated">
  16965. <doc>
  16966. <![CDATA[Constructs a TaskAttemptID object from given parts.
  16967. @param jtIdentifier jobTracker identifier
  16968. @param jobId job number
  16969. @param type the TaskType
  16970. @param taskId taskId number
  16971. @param id the task attempt number]]>
  16972. </doc>
  16973. </constructor>
  16974. <constructor name="TaskAttemptID"
  16975. static="false" final="false" visibility="public"
  16976. deprecated="not deprecated">
  16977. </constructor>
  16978. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  16979. abstract="false" native="false" synchronized="false"
  16980. static="false" final="false" visibility="public"
  16981. deprecated="not deprecated">
  16982. <doc>
  16983. <![CDATA[Returns the {@link JobID} object that this task attempt belongs to]]>
  16984. </doc>
  16985. </method>
  16986. <method name="getTaskID" return="org.apache.hadoop.mapreduce.TaskID"
  16987. abstract="false" native="false" synchronized="false"
  16988. static="false" final="false" visibility="public"
  16989. deprecated="not deprecated">
  16990. <doc>
  16991. <![CDATA[Returns the {@link TaskID} object that this task attempt belongs to]]>
  16992. </doc>
  16993. </method>
  16994. <method name="getTaskType" return="org.apache.hadoop.mapreduce.TaskType"
  16995. abstract="false" native="false" synchronized="false"
  16996. static="false" final="false" visibility="public"
  16997. deprecated="not deprecated">
  16998. <doc>
  16999. <![CDATA[Returns the TaskType of the TaskAttemptID]]>
  17000. </doc>
  17001. </method>
  17002. <method name="equals" return="boolean"
  17003. abstract="false" native="false" synchronized="false"
  17004. static="false" final="false" visibility="public"
  17005. deprecated="not deprecated">
  17006. <param name="o" type="java.lang.Object"/>
  17007. </method>
  17008. <method name="appendTo" return="java.lang.StringBuilder"
  17009. abstract="false" native="false" synchronized="false"
  17010. static="false" final="false" visibility="protected"
  17011. deprecated="not deprecated">
  17012. <param name="builder" type="java.lang.StringBuilder"/>
  17013. <doc>
  17014. <![CDATA[Add the unique string to the StringBuilder
  17015. @param builder the builder to append to
  17016. @return the builder that was passed in.]]>
  17017. </doc>
  17018. </method>
  17019. <method name="readFields"
  17020. abstract="false" native="false" synchronized="false"
  17021. static="false" final="false" visibility="public"
  17022. deprecated="not deprecated">
  17023. <param name="in" type="java.io.DataInput"/>
  17024. <exception name="IOException" type="java.io.IOException"/>
  17025. </method>
  17026. <method name="write"
  17027. abstract="false" native="false" synchronized="false"
  17028. static="false" final="false" visibility="public"
  17029. deprecated="not deprecated">
  17030. <param name="out" type="java.io.DataOutput"/>
  17031. <exception name="IOException" type="java.io.IOException"/>
  17032. </method>
  17033. <method name="hashCode" return="int"
  17034. abstract="false" native="false" synchronized="false"
  17035. static="false" final="false" visibility="public"
  17036. deprecated="not deprecated">
  17037. </method>
  17038. <method name="compareTo" return="int"
  17039. abstract="false" native="false" synchronized="false"
  17040. static="false" final="false" visibility="public"
  17041. deprecated="not deprecated">
  17042. <param name="o" type="org.apache.hadoop.mapreduce.ID"/>
  17043. <doc>
  17044. <![CDATA[Compare TaskIds by first tipIds, then by task numbers.]]>
  17045. </doc>
  17046. </method>
  17047. <method name="toString" return="java.lang.String"
  17048. abstract="false" native="false" synchronized="false"
  17049. static="false" final="false" visibility="public"
  17050. deprecated="not deprecated">
  17051. </method>
  17052. <method name="forName" return="org.apache.hadoop.mapreduce.TaskAttemptID"
  17053. abstract="false" native="false" synchronized="false"
  17054. static="true" final="false" visibility="public"
  17055. deprecated="not deprecated">
  17056. <param name="str" type="java.lang.String"/>
  17057. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  17058. <doc>
  17059. <![CDATA[Construct a TaskAttemptID object from given string
  17060. @return constructed TaskAttemptID object or null if the given String is null
  17061. @throws IllegalArgumentException if the given string is malformed]]>
  17062. </doc>
  17063. </method>
  17064. <field name="ATTEMPT" type="java.lang.String"
  17065. transient="false" volatile="false"
  17066. static="true" final="true" visibility="protected"
  17067. deprecated="not deprecated">
  17068. </field>
  17069. <doc>
  17070. <![CDATA[TaskAttemptID represents the immutable and unique identifier for
  17071. a task attempt. Each task attempt is one particular instance of a Map or
  17072. Reduce Task identified by its TaskID.
  17073. TaskAttemptID consists of 2 parts. First part is the
  17074. {@link TaskID}, that this TaskAttemptID belongs to.
  17075. Second part is the task attempt number. <br>
  17076. An example TaskAttemptID is :
  17077. <code>attempt_200707121733_0003_m_000005_0</code> , which represents the
  17078. zeroth task attempt for the fifth map task in the third job
  17079. running at the jobtracker started at <code>200707121733</code>.
  17080. <p>
  17081. Applications should never construct or parse TaskAttemptID strings,
  17082. but rather use appropriate constructors or {@link #forName(String)}
  17083. method.
  17084. @see JobID
  17085. @see TaskID]]>
  17086. </doc>
  17087. </class>
  17088. <!-- end class org.apache.hadoop.mapreduce.TaskAttemptID -->
  17089. <!-- start class org.apache.hadoop.mapreduce.TaskCompletionEvent -->
  17090. <class name="TaskCompletionEvent" extends="java.lang.Object"
  17091. abstract="false"
  17092. static="false" final="false" visibility="public"
  17093. deprecated="not deprecated">
  17094. <implements name="org.apache.hadoop.io.Writable"/>
  17095. <constructor name="TaskCompletionEvent"
  17096. static="false" final="false" visibility="public"
  17097. deprecated="not deprecated">
  17098. <doc>
  17099. <![CDATA[Default constructor for Writable.]]>
  17100. </doc>
  17101. </constructor>
  17102. <constructor name="TaskCompletionEvent" type="int, org.apache.hadoop.mapreduce.TaskAttemptID, int, boolean, org.apache.hadoop.mapreduce.TaskCompletionEvent.Status, java.lang.String"
  17103. static="false" final="false" visibility="public"
  17104. deprecated="not deprecated">
  17105. <doc>
  17106. <![CDATA[Constructor. eventId should be created externally and incremented
  17107. per event for each job.
  17108. @param eventId event id, event id should be unique and assigned
  17109. incrementally, starting from 0.
  17110. @param taskId task id
  17111. @param status task's status
  17112. @param taskTrackerHttp task tracker's host:port for http.]]>
  17113. </doc>
  17114. </constructor>
  17115. <method name="getEventId" return="int"
  17116. abstract="false" native="false" synchronized="false"
  17117. static="false" final="false" visibility="public"
  17118. deprecated="not deprecated">
  17119. <doc>
  17120. <![CDATA[Returns event Id.
  17121. @return event id]]>
  17122. </doc>
  17123. </method>
  17124. <method name="getTaskAttemptId" return="org.apache.hadoop.mapreduce.TaskAttemptID"
  17125. abstract="false" native="false" synchronized="false"
  17126. static="false" final="false" visibility="public"
  17127. deprecated="not deprecated">
  17128. <doc>
  17129. <![CDATA[Returns task attempt id.
  17130. @return task attempt id]]>
  17131. </doc>
  17132. </method>
  17133. <method name="getStatus" return="org.apache.hadoop.mapreduce.TaskCompletionEvent.Status"
  17134. abstract="false" native="false" synchronized="false"
  17135. static="false" final="false" visibility="public"
  17136. deprecated="not deprecated">
  17137. <doc>
  17138. <![CDATA[Returns enum Status.SUCCESS or Status.FAILURE.
  17139. @return task tracker status]]>
  17140. </doc>
  17141. </method>
  17142. <method name="getTaskTrackerHttp" return="java.lang.String"
  17143. abstract="false" native="false" synchronized="false"
  17144. static="false" final="false" visibility="public"
  17145. deprecated="not deprecated">
  17146. <doc>
  17147. <![CDATA[http location of the tasktracker where this task ran.
  17148. @return http location of tasktracker user logs]]>
  17149. </doc>
  17150. </method>
  17151. <method name="getTaskRunTime" return="int"
  17152. abstract="false" native="false" synchronized="false"
  17153. static="false" final="false" visibility="public"
  17154. deprecated="not deprecated">
  17155. <doc>
  17156. <![CDATA[Returns time (in millisec) the task took to complete.]]>
  17157. </doc>
  17158. </method>
  17159. <method name="setTaskRunTime"
  17160. abstract="false" native="false" synchronized="false"
  17161. static="false" final="false" visibility="protected"
  17162. deprecated="not deprecated">
  17163. <param name="taskCompletionTime" type="int"/>
  17164. <doc>
  17165. <![CDATA[Set the task completion time
  17166. @param taskCompletionTime time (in millisec) the task took to complete]]>
  17167. </doc>
  17168. </method>
  17169. <method name="setEventId"
  17170. abstract="false" native="false" synchronized="false"
  17171. static="false" final="false" visibility="protected"
  17172. deprecated="not deprecated">
  17173. <param name="eventId" type="int"/>
  17174. <doc>
  17175. <![CDATA[set event Id. should be assigned incrementally starting from 0.
  17176. @param eventId]]>
  17177. </doc>
  17178. </method>
  17179. <method name="setTaskAttemptId"
  17180. abstract="false" native="false" synchronized="false"
  17181. static="false" final="false" visibility="protected"
  17182. deprecated="not deprecated">
  17183. <param name="taskId" type="org.apache.hadoop.mapreduce.TaskAttemptID"/>
  17184. <doc>
  17185. <![CDATA[Sets task id.
  17186. @param taskId]]>
  17187. </doc>
  17188. </method>
  17189. <method name="setTaskStatus"
  17190. abstract="false" native="false" synchronized="false"
  17191. static="false" final="false" visibility="protected"
  17192. deprecated="not deprecated">
  17193. <param name="status" type="org.apache.hadoop.mapreduce.TaskCompletionEvent.Status"/>
  17194. <doc>
  17195. <![CDATA[Set task status.
  17196. @param status]]>
  17197. </doc>
  17198. </method>
  17199. <method name="setTaskTrackerHttp"
  17200. abstract="false" native="false" synchronized="false"
  17201. static="false" final="false" visibility="protected"
  17202. deprecated="not deprecated">
  17203. <param name="taskTrackerHttp" type="java.lang.String"/>
  17204. <doc>
  17205. <![CDATA[Set task tracker http location.
  17206. @param taskTrackerHttp]]>
  17207. </doc>
  17208. </method>
  17209. <method name="toString" return="java.lang.String"
  17210. abstract="false" native="false" synchronized="false"
  17211. static="false" final="false" visibility="public"
  17212. deprecated="not deprecated">
  17213. </method>
  17214. <method name="equals" return="boolean"
  17215. abstract="false" native="false" synchronized="false"
  17216. static="false" final="false" visibility="public"
  17217. deprecated="not deprecated">
  17218. <param name="o" type="java.lang.Object"/>
  17219. </method>
  17220. <method name="hashCode" return="int"
  17221. abstract="false" native="false" synchronized="false"
  17222. static="false" final="false" visibility="public"
  17223. deprecated="not deprecated">
  17224. </method>
  17225. <method name="isMapTask" return="boolean"
  17226. abstract="false" native="false" synchronized="false"
  17227. static="false" final="false" visibility="public"
  17228. deprecated="not deprecated">
  17229. </method>
  17230. <method name="idWithinJob" return="int"
  17231. abstract="false" native="false" synchronized="false"
  17232. static="false" final="false" visibility="public"
  17233. deprecated="not deprecated">
  17234. </method>
  17235. <method name="write"
  17236. abstract="false" native="false" synchronized="false"
  17237. static="false" final="false" visibility="public"
  17238. deprecated="not deprecated">
  17239. <param name="out" type="java.io.DataOutput"/>
  17240. <exception name="IOException" type="java.io.IOException"/>
  17241. </method>
  17242. <method name="readFields"
  17243. abstract="false" native="false" synchronized="false"
  17244. static="false" final="false" visibility="public"
  17245. deprecated="not deprecated">
  17246. <param name="in" type="java.io.DataInput"/>
  17247. <exception name="IOException" type="java.io.IOException"/>
  17248. </method>
  17249. <field name="EMPTY_ARRAY" type="org.apache.hadoop.mapreduce.TaskCompletionEvent[]"
  17250. transient="false" volatile="false"
  17251. static="true" final="true" visibility="public"
  17252. deprecated="not deprecated">
  17253. </field>
  17254. <doc>
  17255. <![CDATA[This is used to track task completion events on
  17256. job tracker.]]>
  17257. </doc>
  17258. </class>
  17259. <!-- end class org.apache.hadoop.mapreduce.TaskCompletionEvent -->
  17260. <!-- start class org.apache.hadoop.mapreduce.TaskCompletionEvent.Status -->
  17261. <class name="TaskCompletionEvent.Status" extends="java.lang.Enum"
  17262. abstract="false"
  17263. static="true" final="true" visibility="public"
  17264. deprecated="not deprecated">
  17265. <method name="values" return="org.apache.hadoop.mapreduce.TaskCompletionEvent.Status[]"
  17266. abstract="false" native="false" synchronized="false"
  17267. static="true" final="false" visibility="public"
  17268. deprecated="not deprecated">
  17269. </method>
  17270. <method name="valueOf" return="org.apache.hadoop.mapreduce.TaskCompletionEvent.Status"
  17271. abstract="false" native="false" synchronized="false"
  17272. static="true" final="false" visibility="public"
  17273. deprecated="not deprecated">
  17274. <param name="name" type="java.lang.String"/>
  17275. </method>
  17276. </class>
  17277. <!-- end class org.apache.hadoop.mapreduce.TaskCompletionEvent.Status -->
  17278. <!-- start class org.apache.hadoop.mapreduce.TaskCounter -->
  17279. <class name="TaskCounter" extends="java.lang.Enum"
  17280. abstract="false"
  17281. static="false" final="true" visibility="public"
  17282. deprecated="not deprecated">
  17283. <method name="values" return="org.apache.hadoop.mapreduce.TaskCounter[]"
  17284. abstract="false" native="false" synchronized="false"
  17285. static="true" final="false" visibility="public"
  17286. deprecated="not deprecated">
  17287. </method>
  17288. <method name="valueOf" return="org.apache.hadoop.mapreduce.TaskCounter"
  17289. abstract="false" native="false" synchronized="false"
  17290. static="true" final="false" visibility="public"
  17291. deprecated="not deprecated">
  17292. <param name="name" type="java.lang.String"/>
  17293. </method>
  17294. </class>
  17295. <!-- end class org.apache.hadoop.mapreduce.TaskCounter -->
  17296. <!-- start class org.apache.hadoop.mapreduce.TaskID -->
  17297. <class name="TaskID" extends="org.apache.hadoop.mapred.ID"
  17298. abstract="false"
  17299. static="false" final="false" visibility="public"
  17300. deprecated="not deprecated">
  17301. <constructor name="TaskID" type="org.apache.hadoop.mapreduce.JobID, org.apache.hadoop.mapreduce.TaskType, int"
  17302. static="false" final="false" visibility="public"
  17303. deprecated="not deprecated">
  17304. <doc>
  17305. <![CDATA[Constructs a TaskID object from given {@link JobID}.
  17306. @param jobId JobID that this tip belongs to
  17307. @param type the {@link TaskType} of the task
  17308. @param id the tip number]]>
  17309. </doc>
  17310. </constructor>
  17311. <constructor name="TaskID" type="java.lang.String, int, org.apache.hadoop.mapreduce.TaskType, int"
  17312. static="false" final="false" visibility="public"
  17313. deprecated="not deprecated">
  17314. <doc>
  17315. <![CDATA[Constructs a TaskInProgressId object from given parts.
  17316. @param jtIdentifier jobTracker identifier
  17317. @param jobId job number
  17318. @param type the TaskType
  17319. @param id the tip number]]>
  17320. </doc>
  17321. </constructor>
  17322. <constructor name="TaskID"
  17323. static="false" final="false" visibility="public"
  17324. deprecated="not deprecated">
  17325. </constructor>
  17326. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  17327. abstract="false" native="false" synchronized="false"
  17328. static="false" final="false" visibility="public"
  17329. deprecated="not deprecated">
  17330. <doc>
  17331. <![CDATA[Returns the {@link JobID} object that this tip belongs to]]>
  17332. </doc>
  17333. </method>
  17334. <method name="getTaskType" return="org.apache.hadoop.mapreduce.TaskType"
  17335. abstract="false" native="false" synchronized="false"
  17336. static="false" final="false" visibility="public"
  17337. deprecated="not deprecated">
  17338. <doc>
  17339. <![CDATA[Get the type of the task]]>
  17340. </doc>
  17341. </method>
  17342. <method name="equals" return="boolean"
  17343. abstract="false" native="false" synchronized="false"
  17344. static="false" final="false" visibility="public"
  17345. deprecated="not deprecated">
  17346. <param name="o" type="java.lang.Object"/>
  17347. </method>
  17348. <method name="compareTo" return="int"
  17349. abstract="false" native="false" synchronized="false"
  17350. static="false" final="false" visibility="public"
  17351. deprecated="not deprecated">
  17352. <param name="o" type="org.apache.hadoop.mapreduce.ID"/>
  17353. <doc>
  17354. <![CDATA[Compare TaskInProgressIds by first jobIds, then by tip numbers. Reduces are
  17355. defined as greater than maps.]]>
  17356. </doc>
  17357. </method>
  17358. <method name="toString" return="java.lang.String"
  17359. abstract="false" native="false" synchronized="false"
  17360. static="false" final="false" visibility="public"
  17361. deprecated="not deprecated">
  17362. </method>
  17363. <method name="appendTo" return="java.lang.StringBuilder"
  17364. abstract="false" native="false" synchronized="false"
  17365. static="false" final="false" visibility="protected"
  17366. deprecated="not deprecated">
  17367. <param name="builder" type="java.lang.StringBuilder"/>
  17368. <doc>
  17369. <![CDATA[Add the unique string to the given builder.
  17370. @param builder the builder to append to
  17371. @return the builder that was passed in]]>
  17372. </doc>
  17373. </method>
  17374. <method name="hashCode" return="int"
  17375. abstract="false" native="false" synchronized="false"
  17376. static="false" final="false" visibility="public"
  17377. deprecated="not deprecated">
  17378. </method>
  17379. <method name="readFields"
  17380. abstract="false" native="false" synchronized="false"
  17381. static="false" final="false" visibility="public"
  17382. deprecated="not deprecated">
  17383. <param name="in" type="java.io.DataInput"/>
  17384. <exception name="IOException" type="java.io.IOException"/>
  17385. </method>
  17386. <method name="write"
  17387. abstract="false" native="false" synchronized="false"
  17388. static="false" final="false" visibility="public"
  17389. deprecated="not deprecated">
  17390. <param name="out" type="java.io.DataOutput"/>
  17391. <exception name="IOException" type="java.io.IOException"/>
  17392. </method>
  17393. <method name="forName" return="org.apache.hadoop.mapreduce.TaskID"
  17394. abstract="false" native="false" synchronized="false"
  17395. static="true" final="false" visibility="public"
  17396. deprecated="not deprecated">
  17397. <param name="str" type="java.lang.String"/>
  17398. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  17399. <doc>
  17400. <![CDATA[Construct a TaskID object from given string
  17401. @return constructed TaskID object or null if the given String is null
  17402. @throws IllegalArgumentException if the given string is malformed]]>
  17403. </doc>
  17404. </method>
  17405. <method name="getRepresentingCharacter" return="char"
  17406. abstract="false" native="false" synchronized="false"
  17407. static="true" final="false" visibility="public"
  17408. deprecated="not deprecated">
  17409. <param name="type" type="org.apache.hadoop.mapreduce.TaskType"/>
  17410. <doc>
  17411. <![CDATA[Gets the character representing the {@link TaskType}
  17412. @param type the TaskType
  17413. @return the character]]>
  17414. </doc>
  17415. </method>
  17416. <method name="getTaskType" return="org.apache.hadoop.mapreduce.TaskType"
  17417. abstract="false" native="false" synchronized="false"
  17418. static="true" final="false" visibility="public"
  17419. deprecated="not deprecated">
  17420. <param name="c" type="char"/>
  17421. <doc>
  17422. <![CDATA[Gets the {@link TaskType} corresponding to the character
  17423. @param c the character
  17424. @return the TaskType]]>
  17425. </doc>
  17426. </method>
  17427. <method name="getAllTaskTypes" return="java.lang.String"
  17428. abstract="false" native="false" synchronized="false"
  17429. static="true" final="false" visibility="public"
  17430. deprecated="not deprecated">
  17431. </method>
  17432. <field name="TASK" type="java.lang.String"
  17433. transient="false" volatile="false"
  17434. static="true" final="true" visibility="protected"
  17435. deprecated="not deprecated">
  17436. </field>
  17437. <field name="idFormat" type="java.text.NumberFormat"
  17438. transient="false" volatile="false"
  17439. static="true" final="true" visibility="protected"
  17440. deprecated="not deprecated">
  17441. </field>
  17442. <doc>
  17443. <![CDATA[TaskID represents the immutable and unique identifier for
  17444. a Map or Reduce Task. Each TaskID encompasses multiple attempts made to
  17445. execute the Map or Reduce Task, each of which is uniquely identified by
  17446. their TaskAttemptID.
  17447. TaskID consists of 3 parts. First part is the {@link JobID}, that this
  17448. TaskInProgress belongs to. Second part of the TaskID is either 'm' or 'r'
  17449. representing whether the task is a map task or a reduce task.
  17450. And the third part is the task number. <br>
  17451. An example TaskID is :
  17452. <code>task_200707121733_0003_m_000005</code> , which represents the
  17453. fifth map task in the third job running at the jobtracker
  17454. started at <code>200707121733</code>.
  17455. <p>
  17456. Applications should never construct or parse TaskID strings,
  17457. but rather use appropriate constructors or the {@link #forName(String)}
  17458. method.
  17459. @see JobID
  17460. @see TaskAttemptID]]>
  17461. </doc>
  17462. </class>
  17463. <!-- end class org.apache.hadoop.mapreduce.TaskID -->
  17464. <!-- start interface org.apache.hadoop.mapreduce.TaskInputOutputContext -->
  17465. <interface name="TaskInputOutputContext" abstract="true"
  17466. static="false" final="false" visibility="public"
  17467. deprecated="not deprecated">
  17468. <implements name="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  17469. <method name="nextKeyValue" return="boolean"
  17470. abstract="false" native="false" synchronized="false"
  17471. static="false" final="false" visibility="public"
  17472. deprecated="not deprecated">
  17473. <exception name="IOException" type="java.io.IOException"/>
  17474. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  17475. <doc>
  17476. <![CDATA[Advance to the next key/value pair, returning false if at end.
  17477. @return true if a key/value pair was read, false if there are no more]]>
  17478. </doc>
  17479. </method>
  17480. <method name="getCurrentKey" return="KEYIN"
  17481. abstract="false" native="false" synchronized="false"
  17482. static="false" final="false" visibility="public"
  17483. deprecated="not deprecated">
  17484. <exception name="IOException" type="java.io.IOException"/>
  17485. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  17486. <doc>
  17487. <![CDATA[Get the current key.
  17488. @return the current key object or null if there isn't one
  17489. @throws IOException
  17490. @throws InterruptedException]]>
  17491. </doc>
  17492. </method>
  17493. <method name="getCurrentValue" return="VALUEIN"
  17494. abstract="false" native="false" synchronized="false"
  17495. static="false" final="false" visibility="public"
  17496. deprecated="not deprecated">
  17497. <exception name="IOException" type="java.io.IOException"/>
  17498. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  17499. <doc>
  17500. <![CDATA[Get the current value.
  17501. @return the value object that was read into
  17502. @throws IOException
  17503. @throws InterruptedException]]>
  17504. </doc>
  17505. </method>
  17506. <method name="write"
  17507. abstract="false" native="false" synchronized="false"
  17508. static="false" final="false" visibility="public"
  17509. deprecated="not deprecated">
  17510. <param name="key" type="KEYOUT"/>
  17511. <param name="value" type="VALUEOUT"/>
  17512. <exception name="IOException" type="java.io.IOException"/>
  17513. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  17514. <doc>
  17515. <![CDATA[Generate an output key/value pair.]]>
  17516. </doc>
  17517. </method>
  17518. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  17519. abstract="false" native="false" synchronized="false"
  17520. static="false" final="false" visibility="public"
  17521. deprecated="not deprecated">
  17522. <doc>
  17523. <![CDATA[Get the {@link OutputCommitter} for the task-attempt.
  17524. @return the <code>OutputCommitter</code> for the task-attempt]]>
  17525. </doc>
  17526. </method>
  17527. <doc>
  17528. <![CDATA[A context object that allows input and output from the task. It is only
  17529. supplied to the {@link Mapper} or {@link Reducer}.
  17530. @param <KEYIN> the input key type for the task
  17531. @param <VALUEIN> the input value type for the task
  17532. @param <KEYOUT> the output key type for the task
  17533. @param <VALUEOUT> the output value type for the task]]>
  17534. </doc>
  17535. </interface>
  17536. <!-- end interface org.apache.hadoop.mapreduce.TaskInputOutputContext -->
  17537. <!-- start class org.apache.hadoop.mapreduce.TaskTrackerInfo -->
  17538. <class name="TaskTrackerInfo" extends="java.lang.Object"
  17539. abstract="false"
  17540. static="false" final="false" visibility="public"
  17541. deprecated="not deprecated">
  17542. <implements name="org.apache.hadoop.io.Writable"/>
  17543. <constructor name="TaskTrackerInfo"
  17544. static="false" final="false" visibility="public"
  17545. deprecated="not deprecated">
  17546. </constructor>
  17547. <constructor name="TaskTrackerInfo" type="java.lang.String"
  17548. static="false" final="false" visibility="public"
  17549. deprecated="not deprecated">
  17550. </constructor>
  17551. <constructor name="TaskTrackerInfo" type="java.lang.String, java.lang.String, java.lang.String"
  17552. static="false" final="false" visibility="public"
  17553. deprecated="not deprecated">
  17554. </constructor>
  17555. <method name="getTaskTrackerName" return="java.lang.String"
  17556. abstract="false" native="false" synchronized="false"
  17557. static="false" final="false" visibility="public"
  17558. deprecated="not deprecated">
  17559. <doc>
  17560. <![CDATA[Gets the tasktracker's name.
  17561. @return tracker's name.]]>
  17562. </doc>
  17563. </method>
  17564. <method name="isBlacklisted" return="boolean"
  17565. abstract="false" native="false" synchronized="false"
  17566. static="false" final="false" visibility="public"
  17567. deprecated="not deprecated">
  17568. <doc>
  17569. <![CDATA[Whether tracker is blacklisted
  17570. @return true if tracker is blacklisted
  17571. false otherwise]]>
  17572. </doc>
  17573. </method>
  17574. <method name="getReasonForBlacklist" return="java.lang.String"
  17575. abstract="false" native="false" synchronized="false"
  17576. static="false" final="false" visibility="public"
  17577. deprecated="not deprecated">
  17578. <doc>
  17579. <![CDATA[Gets the reason for which the tasktracker was blacklisted.
  17580. @return the reason for which the tracker was blacklisted]]>
  17581. </doc>
  17582. </method>
  17583. <method name="getBlacklistReport" return="java.lang.String"
  17584. abstract="false" native="false" synchronized="false"
  17585. static="false" final="false" visibility="public"
  17586. deprecated="not deprecated">
  17587. <doc>
  17588. <![CDATA[Gets a descriptive report about why the tasktracker was blacklisted.
  17589. @return report describing why the tasktracker was blacklisted.]]>
  17590. </doc>
  17591. </method>
  17592. <method name="readFields"
  17593. abstract="false" native="false" synchronized="false"
  17594. static="false" final="false" visibility="public"
  17595. deprecated="not deprecated">
  17596. <param name="in" type="java.io.DataInput"/>
  17597. <exception name="IOException" type="java.io.IOException"/>
  17598. </method>
  17599. <method name="write"
  17600. abstract="false" native="false" synchronized="false"
  17601. static="false" final="false" visibility="public"
  17602. deprecated="not deprecated">
  17603. <param name="out" type="java.io.DataOutput"/>
  17604. <exception name="IOException" type="java.io.IOException"/>
  17605. </method>
  17606. <doc>
  17607. <![CDATA[Information about TaskTracker.]]>
  17608. </doc>
  17609. </class>
  17610. <!-- end class org.apache.hadoop.mapreduce.TaskTrackerInfo -->
  17611. <!-- start class org.apache.hadoop.mapreduce.TaskType -->
  17612. <class name="TaskType" extends="java.lang.Enum"
  17613. abstract="false"
  17614. static="false" final="true" visibility="public"
  17615. deprecated="not deprecated">
  17616. <method name="values" return="org.apache.hadoop.mapreduce.TaskType[]"
  17617. abstract="false" native="false" synchronized="false"
  17618. static="true" final="false" visibility="public"
  17619. deprecated="not deprecated">
  17620. </method>
  17621. <method name="valueOf" return="org.apache.hadoop.mapreduce.TaskType"
  17622. abstract="false" native="false" synchronized="false"
  17623. static="true" final="false" visibility="public"
  17624. deprecated="not deprecated">
  17625. <param name="name" type="java.lang.String"/>
  17626. </method>
  17627. <doc>
  17628. <![CDATA[Enum for map, reduce, job-setup, job-cleanup, task-cleanup task types.]]>
  17629. </doc>
  17630. </class>
  17631. <!-- end class org.apache.hadoop.mapreduce.TaskType -->
  17632. </package>
  17633. <package name="org.apache.hadoop.mapreduce.lib.aggregate">
  17634. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.DoubleValueSum -->
  17635. <class name="DoubleValueSum" extends="java.lang.Object"
  17636. abstract="false"
  17637. static="false" final="false" visibility="public"
  17638. deprecated="not deprecated">
  17639. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  17640. <constructor name="DoubleValueSum"
  17641. static="false" final="false" visibility="public"
  17642. deprecated="not deprecated">
  17643. <doc>
  17644. <![CDATA[The default constructor]]>
  17645. </doc>
  17646. </constructor>
  17647. <method name="addNextValue"
  17648. abstract="false" native="false" synchronized="false"
  17649. static="false" final="false" visibility="public"
  17650. deprecated="not deprecated">
  17651. <param name="val" type="java.lang.Object"/>
  17652. <doc>
  17653. <![CDATA[add a value to the aggregator
  17654. @param val
  17655. an object whose string representation represents a double value.]]>
  17656. </doc>
  17657. </method>
  17658. <method name="addNextValue"
  17659. abstract="false" native="false" synchronized="false"
  17660. static="false" final="false" visibility="public"
  17661. deprecated="not deprecated">
  17662. <param name="val" type="double"/>
  17663. <doc>
  17664. <![CDATA[add a value to the aggregator
  17665. @param val
  17666. a double value.]]>
  17667. </doc>
  17668. </method>
  17669. <method name="getReport" return="java.lang.String"
  17670. abstract="false" native="false" synchronized="false"
  17671. static="false" final="false" visibility="public"
  17672. deprecated="not deprecated">
  17673. <doc>
  17674. <![CDATA[@return the string representation of the aggregated value]]>
  17675. </doc>
  17676. </method>
  17677. <method name="getSum" return="double"
  17678. abstract="false" native="false" synchronized="false"
  17679. static="false" final="false" visibility="public"
  17680. deprecated="not deprecated">
  17681. <doc>
  17682. <![CDATA[@return the aggregated value]]>
  17683. </doc>
  17684. </method>
  17685. <method name="reset"
  17686. abstract="false" native="false" synchronized="false"
  17687. static="false" final="false" visibility="public"
  17688. deprecated="not deprecated">
  17689. <doc>
  17690. <![CDATA[reset the aggregator]]>
  17691. </doc>
  17692. </method>
  17693. <method name="getCombinerOutput" return="java.util.ArrayList"
  17694. abstract="false" native="false" synchronized="false"
  17695. static="false" final="false" visibility="public"
  17696. deprecated="not deprecated">
  17697. <doc>
  17698. <![CDATA[@return an array of one element. The element is a string
  17699. representation of the aggregated value. The return value is
  17700. expected to be used by a combiner.]]>
  17701. </doc>
  17702. </method>
  17703. <doc>
  17704. <![CDATA[This class implements a value aggregator that sums up a sequence of double
  17705. values.]]>
  17706. </doc>
  17707. </class>
  17708. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.DoubleValueSum -->
  17709. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.LongValueMax -->
  17710. <class name="LongValueMax" extends="java.lang.Object"
  17711. abstract="false"
  17712. static="false" final="false" visibility="public"
  17713. deprecated="not deprecated">
  17714. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  17715. <constructor name="LongValueMax"
  17716. static="false" final="false" visibility="public"
  17717. deprecated="not deprecated">
  17718. <doc>
  17719. <![CDATA[the default constructor]]>
  17720. </doc>
  17721. </constructor>
  17722. <method name="addNextValue"
  17723. abstract="false" native="false" synchronized="false"
  17724. static="false" final="false" visibility="public"
  17725. deprecated="not deprecated">
  17726. <param name="val" type="java.lang.Object"/>
  17727. <doc>
  17728. <![CDATA[add a value to the aggregator
  17729. @param val
  17730. an object whose string representation represents a long value.]]>
  17731. </doc>
  17732. </method>
  17733. <method name="addNextValue"
  17734. abstract="false" native="false" synchronized="false"
  17735. static="false" final="false" visibility="public"
  17736. deprecated="not deprecated">
  17737. <param name="newVal" type="long"/>
  17738. <doc>
  17739. <![CDATA[add a value to the aggregator
  17740. @param newVal
  17741. a long value.]]>
  17742. </doc>
  17743. </method>
  17744. <method name="getVal" return="long"
  17745. abstract="false" native="false" synchronized="false"
  17746. static="false" final="false" visibility="public"
  17747. deprecated="not deprecated">
  17748. <doc>
  17749. <![CDATA[@return the aggregated value]]>
  17750. </doc>
  17751. </method>
  17752. <method name="getReport" return="java.lang.String"
  17753. abstract="false" native="false" synchronized="false"
  17754. static="false" final="false" visibility="public"
  17755. deprecated="not deprecated">
  17756. <doc>
  17757. <![CDATA[@return the string representation of the aggregated value]]>
  17758. </doc>
  17759. </method>
  17760. <method name="reset"
  17761. abstract="false" native="false" synchronized="false"
  17762. static="false" final="false" visibility="public"
  17763. deprecated="not deprecated">
  17764. <doc>
  17765. <![CDATA[reset the aggregator]]>
  17766. </doc>
  17767. </method>
  17768. <method name="getCombinerOutput" return="java.util.ArrayList"
  17769. abstract="false" native="false" synchronized="false"
  17770. static="false" final="false" visibility="public"
  17771. deprecated="not deprecated">
  17772. <doc>
  17773. <![CDATA[@return an array of one element. The element is a string
  17774. representation of the aggregated value. The return value is
  17775. expected to be used by a combiner.]]>
  17776. </doc>
  17777. </method>
  17778. <doc>
  17779. <![CDATA[This class implements a value aggregator that maintains the maximum of
  17780. a sequence of long values.]]>
  17781. </doc>
  17782. </class>
  17783. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.LongValueMax -->
  17784. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.LongValueMin -->
  17785. <class name="LongValueMin" extends="java.lang.Object"
  17786. abstract="false"
  17787. static="false" final="false" visibility="public"
  17788. deprecated="not deprecated">
  17789. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  17790. <constructor name="LongValueMin"
  17791. static="false" final="false" visibility="public"
  17792. deprecated="not deprecated">
  17793. <doc>
  17794. <![CDATA[the default constructor]]>
  17795. </doc>
  17796. </constructor>
  17797. <method name="addNextValue"
  17798. abstract="false" native="false" synchronized="false"
  17799. static="false" final="false" visibility="public"
  17800. deprecated="not deprecated">
  17801. <param name="val" type="java.lang.Object"/>
  17802. <doc>
  17803. <![CDATA[add a value to the aggregator
  17804. @param val
  17805. an object whose string representation represents a long value.]]>
  17806. </doc>
  17807. </method>
  17808. <method name="addNextValue"
  17809. abstract="false" native="false" synchronized="false"
  17810. static="false" final="false" visibility="public"
  17811. deprecated="not deprecated">
  17812. <param name="newVal" type="long"/>
  17813. <doc>
  17814. <![CDATA[add a value to the aggregator
  17815. @param newVal
  17816. a long value.]]>
  17817. </doc>
  17818. </method>
  17819. <method name="getVal" return="long"
  17820. abstract="false" native="false" synchronized="false"
  17821. static="false" final="false" visibility="public"
  17822. deprecated="not deprecated">
  17823. <doc>
  17824. <![CDATA[@return the aggregated value]]>
  17825. </doc>
  17826. </method>
  17827. <method name="getReport" return="java.lang.String"
  17828. abstract="false" native="false" synchronized="false"
  17829. static="false" final="false" visibility="public"
  17830. deprecated="not deprecated">
  17831. <doc>
  17832. <![CDATA[@return the string representation of the aggregated value]]>
  17833. </doc>
  17834. </method>
  17835. <method name="reset"
  17836. abstract="false" native="false" synchronized="false"
  17837. static="false" final="false" visibility="public"
  17838. deprecated="not deprecated">
  17839. <doc>
  17840. <![CDATA[reset the aggregator]]>
  17841. </doc>
  17842. </method>
  17843. <method name="getCombinerOutput" return="java.util.ArrayList"
  17844. abstract="false" native="false" synchronized="false"
  17845. static="false" final="false" visibility="public"
  17846. deprecated="not deprecated">
  17847. <doc>
  17848. <![CDATA[@return an array of one element. The element is a string
  17849. representation of the aggregated value. The return value is
  17850. expected to be used by a combiner.]]>
  17851. </doc>
  17852. </method>
  17853. <doc>
  17854. <![CDATA[This class implements a value aggregator that maintains the minimum of
  17855. a sequence of long values.]]>
  17856. </doc>
  17857. </class>
  17858. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.LongValueMin -->
  17859. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.LongValueSum -->
  17860. <class name="LongValueSum" extends="java.lang.Object"
  17861. abstract="false"
  17862. static="false" final="false" visibility="public"
  17863. deprecated="not deprecated">
  17864. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  17865. <constructor name="LongValueSum"
  17866. static="false" final="false" visibility="public"
  17867. deprecated="not deprecated">
  17868. <doc>
  17869. <![CDATA[the default constructor]]>
  17870. </doc>
  17871. </constructor>
  17872. <method name="addNextValue"
  17873. abstract="false" native="false" synchronized="false"
  17874. static="false" final="false" visibility="public"
  17875. deprecated="not deprecated">
  17876. <param name="val" type="java.lang.Object"/>
  17877. <doc>
  17878. <![CDATA[add a value to the aggregator
  17879. @param val
  17880. an object whose string representation represents a long value.]]>
  17881. </doc>
  17882. </method>
  17883. <method name="addNextValue"
  17884. abstract="false" native="false" synchronized="false"
  17885. static="false" final="false" visibility="public"
  17886. deprecated="not deprecated">
  17887. <param name="val" type="long"/>
  17888. <doc>
  17889. <![CDATA[add a value to the aggregator
  17890. @param val
  17891. a long value.]]>
  17892. </doc>
  17893. </method>
  17894. <method name="getSum" return="long"
  17895. abstract="false" native="false" synchronized="false"
  17896. static="false" final="false" visibility="public"
  17897. deprecated="not deprecated">
  17898. <doc>
  17899. <![CDATA[@return the aggregated value]]>
  17900. </doc>
  17901. </method>
  17902. <method name="getReport" return="java.lang.String"
  17903. abstract="false" native="false" synchronized="false"
  17904. static="false" final="false" visibility="public"
  17905. deprecated="not deprecated">
  17906. <doc>
  17907. <![CDATA[@return the string representation of the aggregated value]]>
  17908. </doc>
  17909. </method>
  17910. <method name="reset"
  17911. abstract="false" native="false" synchronized="false"
  17912. static="false" final="false" visibility="public"
  17913. deprecated="not deprecated">
  17914. <doc>
  17915. <![CDATA[reset the aggregator]]>
  17916. </doc>
  17917. </method>
  17918. <method name="getCombinerOutput" return="java.util.ArrayList"
  17919. abstract="false" native="false" synchronized="false"
  17920. static="false" final="false" visibility="public"
  17921. deprecated="not deprecated">
  17922. <doc>
  17923. <![CDATA[@return an array of one element. The element is a string
  17924. representation of the aggregated value. The return value is
  17925. expected to be used by a combiner.]]>
  17926. </doc>
  17927. </method>
  17928. <doc>
  17929. <![CDATA[This class implements a value aggregator that sums up
  17930. a sequence of long values.]]>
  17931. </doc>
  17932. </class>
  17933. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.LongValueSum -->
  17934. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.StringValueMax -->
  17935. <class name="StringValueMax" extends="java.lang.Object"
  17936. abstract="false"
  17937. static="false" final="false" visibility="public"
  17938. deprecated="not deprecated">
  17939. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  17940. <constructor name="StringValueMax"
  17941. static="false" final="false" visibility="public"
  17942. deprecated="not deprecated">
  17943. <doc>
  17944. <![CDATA[the default constructor]]>
  17945. </doc>
  17946. </constructor>
  17947. <method name="addNextValue"
  17948. abstract="false" native="false" synchronized="false"
  17949. static="false" final="false" visibility="public"
  17950. deprecated="not deprecated">
  17951. <param name="val" type="java.lang.Object"/>
  17952. <doc>
  17953. <![CDATA[add a value to the aggregator
  17954. @param val
  17955. a string.]]>
  17956. </doc>
  17957. </method>
  17958. <method name="getVal" return="java.lang.String"
  17959. abstract="false" native="false" synchronized="false"
  17960. static="false" final="false" visibility="public"
  17961. deprecated="not deprecated">
  17962. <doc>
  17963. <![CDATA[@return the aggregated value]]>
  17964. </doc>
  17965. </method>
  17966. <method name="getReport" return="java.lang.String"
  17967. abstract="false" native="false" synchronized="false"
  17968. static="false" final="false" visibility="public"
  17969. deprecated="not deprecated">
  17970. <doc>
  17971. <![CDATA[@return the string representation of the aggregated value]]>
  17972. </doc>
  17973. </method>
  17974. <method name="reset"
  17975. abstract="false" native="false" synchronized="false"
  17976. static="false" final="false" visibility="public"
  17977. deprecated="not deprecated">
  17978. <doc>
  17979. <![CDATA[reset the aggregator]]>
  17980. </doc>
  17981. </method>
  17982. <method name="getCombinerOutput" return="java.util.ArrayList"
  17983. abstract="false" native="false" synchronized="false"
  17984. static="false" final="false" visibility="public"
  17985. deprecated="not deprecated">
  17986. <doc>
  17987. <![CDATA[@return an array of one element. The element is a string
  17988. representation of the aggregated value. The return value is
  17989. expected to be used by a combiner.]]>
  17990. </doc>
  17991. </method>
  17992. <doc>
  17993. <![CDATA[This class implements a value aggregator that maintains the biggest of
  17994. a sequence of strings.]]>
  17995. </doc>
  17996. </class>
  17997. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.StringValueMax -->
  17998. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.StringValueMin -->
  17999. <class name="StringValueMin" extends="java.lang.Object"
  18000. abstract="false"
  18001. static="false" final="false" visibility="public"
  18002. deprecated="not deprecated">
  18003. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  18004. <constructor name="StringValueMin"
  18005. static="false" final="false" visibility="public"
  18006. deprecated="not deprecated">
  18007. <doc>
  18008. <![CDATA[the default constructor]]>
  18009. </doc>
  18010. </constructor>
  18011. <method name="addNextValue"
  18012. abstract="false" native="false" synchronized="false"
  18013. static="false" final="false" visibility="public"
  18014. deprecated="not deprecated">
  18015. <param name="val" type="java.lang.Object"/>
  18016. <doc>
  18017. <![CDATA[add a value to the aggregator
  18018. @param val
  18019. a string.]]>
  18020. </doc>
  18021. </method>
  18022. <method name="getVal" return="java.lang.String"
  18023. abstract="false" native="false" synchronized="false"
  18024. static="false" final="false" visibility="public"
  18025. deprecated="not deprecated">
  18026. <doc>
  18027. <![CDATA[@return the aggregated value]]>
  18028. </doc>
  18029. </method>
  18030. <method name="getReport" return="java.lang.String"
  18031. abstract="false" native="false" synchronized="false"
  18032. static="false" final="false" visibility="public"
  18033. deprecated="not deprecated">
  18034. <doc>
  18035. <![CDATA[@return the string representation of the aggregated value]]>
  18036. </doc>
  18037. </method>
  18038. <method name="reset"
  18039. abstract="false" native="false" synchronized="false"
  18040. static="false" final="false" visibility="public"
  18041. deprecated="not deprecated">
  18042. <doc>
  18043. <![CDATA[reset the aggregator]]>
  18044. </doc>
  18045. </method>
  18046. <method name="getCombinerOutput" return="java.util.ArrayList"
  18047. abstract="false" native="false" synchronized="false"
  18048. static="false" final="false" visibility="public"
  18049. deprecated="not deprecated">
  18050. <doc>
  18051. <![CDATA[@return an array of one element. The element is a string
  18052. representation of the aggregated value. The return value is
  18053. expected to be used by a combiner.]]>
  18054. </doc>
  18055. </method>
  18056. <doc>
  18057. <![CDATA[This class implements a value aggregator that maintains the smallest of
  18058. a sequence of strings.]]>
  18059. </doc>
  18060. </class>
  18061. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.StringValueMin -->
  18062. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.UniqValueCount -->
  18063. <class name="UniqValueCount" extends="java.lang.Object"
  18064. abstract="false"
  18065. static="false" final="false" visibility="public"
  18066. deprecated="not deprecated">
  18067. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  18068. <constructor name="UniqValueCount"
  18069. static="false" final="false" visibility="public"
  18070. deprecated="not deprecated">
  18071. <doc>
  18072. <![CDATA[the default constructor]]>
  18073. </doc>
  18074. </constructor>
  18075. <constructor name="UniqValueCount" type="long"
  18076. static="false" final="false" visibility="public"
  18077. deprecated="not deprecated">
  18078. <doc>
  18079. <![CDATA[constructor
  18080. @param maxNum the limit in the number of unique values to keep.]]>
  18081. </doc>
  18082. </constructor>
  18083. <method name="setMaxItems" return="long"
  18084. abstract="false" native="false" synchronized="false"
  18085. static="false" final="false" visibility="public"
  18086. deprecated="not deprecated">
  18087. <param name="n" type="long"/>
  18088. <doc>
  18089. <![CDATA[Set the limit on the number of unique values
  18090. @param n the desired limit on the number of unique values
  18091. @return the new limit on the number of unique values]]>
  18092. </doc>
  18093. </method>
  18094. <method name="addNextValue"
  18095. abstract="false" native="false" synchronized="false"
  18096. static="false" final="false" visibility="public"
  18097. deprecated="not deprecated">
  18098. <param name="val" type="java.lang.Object"/>
  18099. <doc>
  18100. <![CDATA[add a value to the aggregator
  18101. @param val
  18102. an object.]]>
  18103. </doc>
  18104. </method>
  18105. <method name="getReport" return="java.lang.String"
  18106. abstract="false" native="false" synchronized="false"
  18107. static="false" final="false" visibility="public"
  18108. deprecated="not deprecated">
  18109. <doc>
  18110. <![CDATA[@return the number of unique objects aggregated]]>
  18111. </doc>
  18112. </method>
  18113. <method name="getUniqueItems" return="java.util.Set"
  18114. abstract="false" native="false" synchronized="false"
  18115. static="false" final="false" visibility="public"
  18116. deprecated="not deprecated">
  18117. <doc>
  18118. <![CDATA[@return the set of the unique objects]]>
  18119. </doc>
  18120. </method>
  18121. <method name="reset"
  18122. abstract="false" native="false" synchronized="false"
  18123. static="false" final="false" visibility="public"
  18124. deprecated="not deprecated">
  18125. <doc>
  18126. <![CDATA[reset the aggregator]]>
  18127. </doc>
  18128. </method>
  18129. <method name="getCombinerOutput" return="java.util.ArrayList"
  18130. abstract="false" native="false" synchronized="false"
  18131. static="false" final="false" visibility="public"
  18132. deprecated="not deprecated">
  18133. <doc>
  18134. <![CDATA[@return an array of the unique objects. The return value is
  18135. expected to be used by a combiner.]]>
  18136. </doc>
  18137. </method>
  18138. <field name="MAX_NUM_UNIQUE_VALUES" type="java.lang.String"
  18139. transient="false" volatile="false"
  18140. static="true" final="true" visibility="public"
  18141. deprecated="not deprecated">
  18142. </field>
  18143. <doc>
  18144. <![CDATA[This class implements a value aggregator that dedupes a sequence of objects.]]>
  18145. </doc>
  18146. </class>
  18147. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.UniqValueCount -->
  18148. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.UserDefinedValueAggregatorDescriptor -->
  18149. <class name="UserDefinedValueAggregatorDescriptor" extends="java.lang.Object"
  18150. abstract="false"
  18151. static="false" final="false" visibility="public"
  18152. deprecated="not deprecated">
  18153. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor"/>
  18154. <constructor name="UserDefinedValueAggregatorDescriptor" type="java.lang.String, org.apache.hadoop.conf.Configuration"
  18155. static="false" final="false" visibility="public"
  18156. deprecated="not deprecated">
  18157. <doc>
  18158. <![CDATA[@param className the class name of the user defined descriptor class
  18159. @param conf a configuration object used for descriptor configuration]]>
  18160. </doc>
  18161. </constructor>
  18162. <method name="createInstance" return="java.lang.Object"
  18163. abstract="false" native="false" synchronized="false"
  18164. static="true" final="false" visibility="public"
  18165. deprecated="not deprecated">
  18166. <param name="className" type="java.lang.String"/>
  18167. <doc>
  18168. <![CDATA[Create an instance of the given class
  18169. @param className the name of the class
  18170. @return a dynamically created instance of the given class]]>
  18171. </doc>
  18172. </method>
  18173. <method name="generateKeyValPairs" return="java.util.ArrayList"
  18174. abstract="false" native="false" synchronized="false"
  18175. static="false" final="false" visibility="public"
  18176. deprecated="not deprecated">
  18177. <param name="key" type="java.lang.Object"/>
  18178. <param name="val" type="java.lang.Object"/>
  18179. <doc>
  18180. <![CDATA[Generate a list of aggregation-id/value pairs for the given
  18181. key/value pairs by delegating the invocation to the real object.
  18182. @param key
  18183. input key
  18184. @param val
  18185. input value
  18186. @return a list of aggregation id/value pairs. An aggregation id encodes an
  18187. aggregation type which is used to guide the way to aggregate the
  18188. value in the reduce/combiner phase of an Aggregate based job.]]>
  18189. </doc>
  18190. </method>
  18191. <method name="toString" return="java.lang.String"
  18192. abstract="false" native="false" synchronized="false"
  18193. static="false" final="false" visibility="public"
  18194. deprecated="not deprecated">
  18195. <doc>
  18196. <![CDATA[@return the string representation of this object.]]>
  18197. </doc>
  18198. </method>
  18199. <method name="configure"
  18200. abstract="false" native="false" synchronized="false"
  18201. static="false" final="false" visibility="public"
  18202. deprecated="not deprecated">
  18203. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  18204. <doc>
  18205. <![CDATA[Do nothing.]]>
  18206. </doc>
  18207. </method>
  18208. <field name="theAggregatorDescriptor" type="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor"
  18209. transient="false" volatile="false"
  18210. static="false" final="false" visibility="protected"
  18211. deprecated="not deprecated">
  18212. </field>
  18213. <doc>
  18214. <![CDATA[This class implements a wrapper for a user defined value
  18215. aggregator descriptor.
  18216. It serves two functions: One is to create an object of
  18217. ValueAggregatorDescriptor from the name of a user defined class
  18218. that may be dynamically loaded. The other is to
  18219. delegate invocations of generateKeyValPairs function to the created object.]]>
  18220. </doc>
  18221. </class>
  18222. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.UserDefinedValueAggregatorDescriptor -->
  18223. <!-- start interface org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator -->
  18224. <interface name="ValueAggregator" abstract="true"
  18225. static="false" final="false" visibility="public"
  18226. deprecated="not deprecated">
  18227. <method name="addNextValue"
  18228. abstract="false" native="false" synchronized="false"
  18229. static="false" final="false" visibility="public"
  18230. deprecated="not deprecated">
  18231. <param name="val" type="java.lang.Object"/>
  18232. <doc>
  18233. <![CDATA[add a value to the aggregator
  18234. @param val the value to be added]]>
  18235. </doc>
  18236. </method>
  18237. <method name="reset"
  18238. abstract="false" native="false" synchronized="false"
  18239. static="false" final="false" visibility="public"
  18240. deprecated="not deprecated">
  18241. <doc>
  18242. <![CDATA[reset the aggregator]]>
  18243. </doc>
  18244. </method>
  18245. <method name="getReport" return="java.lang.String"
  18246. abstract="false" native="false" synchronized="false"
  18247. static="false" final="false" visibility="public"
  18248. deprecated="not deprecated">
  18249. <doc>
  18250. <![CDATA[@return the string representation of the aggregator]]>
  18251. </doc>
  18252. </method>
  18253. <method name="getCombinerOutput" return="java.util.ArrayList"
  18254. abstract="false" native="false" synchronized="false"
  18255. static="false" final="false" visibility="public"
  18256. deprecated="not deprecated">
  18257. <doc>
  18258. <![CDATA[@return an array of values as the outputs of the combiner.]]>
  18259. </doc>
  18260. </method>
  18261. <doc>
  18262. <![CDATA[This interface defines the minimal protocol for value aggregators.]]>
  18263. </doc>
  18264. </interface>
  18265. <!-- end interface org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator -->
  18266. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorBaseDescriptor -->
  18267. <class name="ValueAggregatorBaseDescriptor" extends="java.lang.Object"
  18268. abstract="false"
  18269. static="false" final="false" visibility="public"
  18270. deprecated="not deprecated">
  18271. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor"/>
  18272. <constructor name="ValueAggregatorBaseDescriptor"
  18273. static="false" final="false" visibility="public"
  18274. deprecated="not deprecated">
  18275. </constructor>
  18276. <method name="generateEntry" return="java.util.Map.Entry"
  18277. abstract="false" native="false" synchronized="false"
  18278. static="true" final="false" visibility="public"
  18279. deprecated="not deprecated">
  18280. <param name="type" type="java.lang.String"/>
  18281. <param name="id" type="java.lang.String"/>
  18282. <param name="val" type="org.apache.hadoop.io.Text"/>
  18283. <doc>
  18284. <![CDATA[@param type the aggregation type
  18285. @param id the aggregation id
  18286. @param val the val associated with the id to be aggregated
  18287. @return an Entry whose key is the aggregation id prefixed with
  18288. the aggregation type.]]>
  18289. </doc>
  18290. </method>
  18291. <method name="generateValueAggregator" return="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"
  18292. abstract="false" native="false" synchronized="false"
  18293. static="true" final="false" visibility="public"
  18294. deprecated="not deprecated">
  18295. <param name="type" type="java.lang.String"/>
  18296. <param name="uniqCount" type="long"/>
  18297. <doc>
  18298. <![CDATA[@param type the aggregation type
  18299. @param uniqCount the limit in the number of unique values to keep,
  18300. if type is UNIQ_VALUE_COUNT
  18301. @return a value aggregator of the given type.]]>
  18302. </doc>
  18303. </method>
  18304. <method name="generateKeyValPairs" return="java.util.ArrayList"
  18305. abstract="false" native="false" synchronized="false"
  18306. static="false" final="false" visibility="public"
  18307. deprecated="not deprecated">
  18308. <param name="key" type="java.lang.Object"/>
  18309. <param name="val" type="java.lang.Object"/>
  18310. <doc>
  18311. <![CDATA[Generate 1 or 2 aggregation-id/value pairs for the given key/value pair.
  18312. The first id will be of type LONG_VALUE_SUM, with "record_count" as
  18313. its aggregation id. If the input is a file split,
  18314. the second id of the same type will be generated too, with the file name
  18315. as its aggregation id. This achieves the behavior of counting the total
  18316. number of records in the input data, and the number of records
  18317. in each input file.
  18318. @param key
  18319. input key
  18320. @param val
  18321. input value
  18322. @return a list of aggregation id/value pairs. An aggregation id encodes an
  18323. aggregation type which is used to guide the way to aggregate the
  18324. value in the reduce/combiner phase of an Aggregate based job.]]>
  18325. </doc>
  18326. </method>
  18327. <method name="configure"
  18328. abstract="false" native="false" synchronized="false"
  18329. static="false" final="false" visibility="public"
  18330. deprecated="not deprecated">
  18331. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  18332. <doc>
  18333. <![CDATA[get the input file name.
  18334. @param conf a configuration object]]>
  18335. </doc>
  18336. </method>
  18337. <field name="UNIQ_VALUE_COUNT" type="java.lang.String"
  18338. transient="false" volatile="false"
  18339. static="true" final="true" visibility="public"
  18340. deprecated="not deprecated">
  18341. </field>
  18342. <field name="LONG_VALUE_SUM" type="java.lang.String"
  18343. transient="false" volatile="false"
  18344. static="true" final="true" visibility="public"
  18345. deprecated="not deprecated">
  18346. </field>
  18347. <field name="DOUBLE_VALUE_SUM" type="java.lang.String"
  18348. transient="false" volatile="false"
  18349. static="true" final="true" visibility="public"
  18350. deprecated="not deprecated">
  18351. </field>
  18352. <field name="VALUE_HISTOGRAM" type="java.lang.String"
  18353. transient="false" volatile="false"
  18354. static="true" final="true" visibility="public"
  18355. deprecated="not deprecated">
  18356. </field>
  18357. <field name="LONG_VALUE_MAX" type="java.lang.String"
  18358. transient="false" volatile="false"
  18359. static="true" final="true" visibility="public"
  18360. deprecated="not deprecated">
  18361. </field>
  18362. <field name="LONG_VALUE_MIN" type="java.lang.String"
  18363. transient="false" volatile="false"
  18364. static="true" final="true" visibility="public"
  18365. deprecated="not deprecated">
  18366. </field>
  18367. <field name="STRING_VALUE_MAX" type="java.lang.String"
  18368. transient="false" volatile="false"
  18369. static="true" final="true" visibility="public"
  18370. deprecated="not deprecated">
  18371. </field>
  18372. <field name="STRING_VALUE_MIN" type="java.lang.String"
  18373. transient="false" volatile="false"
  18374. static="true" final="true" visibility="public"
  18375. deprecated="not deprecated">
  18376. </field>
  18377. <field name="inputFile" type="java.lang.String"
  18378. transient="false" volatile="false"
  18379. static="false" final="false" visibility="public"
  18380. deprecated="not deprecated">
  18381. </field>
  18382. <doc>
  18383. <![CDATA[This class implements the common functionalities of
  18384. the subclasses of ValueAggregatorDescriptor class.]]>
  18385. </doc>
  18386. </class>
  18387. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorBaseDescriptor -->
  18388. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorCombiner -->
  18389. <class name="ValueAggregatorCombiner" extends="org.apache.hadoop.mapreduce.Reducer"
  18390. abstract="false"
  18391. static="false" final="false" visibility="public"
  18392. deprecated="not deprecated">
  18393. <constructor name="ValueAggregatorCombiner"
  18394. static="false" final="false" visibility="public"
  18395. deprecated="not deprecated">
  18396. </constructor>
  18397. <method name="reduce"
  18398. abstract="false" native="false" synchronized="false"
  18399. static="false" final="false" visibility="public"
  18400. deprecated="not deprecated">
  18401. <param name="key" type="org.apache.hadoop.io.Text"/>
  18402. <param name="values" type="java.lang.Iterable"/>
  18403. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  18404. <exception name="IOException" type="java.io.IOException"/>
  18405. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18406. <doc>
  18407. <![CDATA[Combines values for a given key.
  18408. @param key the key is expected to be a Text object, whose prefix indicates
  18409. the type of aggregation to aggregate the values.
  18410. @param values the values to combine
  18411. @param context to collect combined values]]>
  18412. </doc>
  18413. </method>
  18414. <doc>
  18415. <![CDATA[This class implements the generic combiner of Aggregate.]]>
  18416. </doc>
  18417. </class>
  18418. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorCombiner -->
  18419. <!-- start interface org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor -->
  18420. <interface name="ValueAggregatorDescriptor" abstract="true"
  18421. static="false" final="false" visibility="public"
  18422. deprecated="not deprecated">
  18423. <method name="generateKeyValPairs" return="java.util.ArrayList"
  18424. abstract="false" native="false" synchronized="false"
  18425. static="false" final="false" visibility="public"
  18426. deprecated="not deprecated">
  18427. <param name="key" type="java.lang.Object"/>
  18428. <param name="val" type="java.lang.Object"/>
  18429. <doc>
  18430. <![CDATA[Generate a list of aggregation-id/value pairs for
  18431. the given key/value pair.
  18432. This function is usually called by the mapper of an Aggregate based job.
  18433. @param key
  18434. input key
  18435. @param val
  18436. input value
  18437. @return a list of aggregation id/value pairs. An aggregation id encodes an
  18438. aggregation type which is used to guide the way to aggregate the
  18439. value in the reduce/combiner phase of an Aggregate based job.]]>
  18440. </doc>
  18441. </method>
  18442. <method name="configure"
  18443. abstract="false" native="false" synchronized="false"
  18444. static="false" final="false" visibility="public"
  18445. deprecated="not deprecated">
  18446. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  18447. <doc>
  18448. <![CDATA[Configure the object
  18449. @param conf
  18450. a Configuration object that may contain the information
  18451. that can be used to configure the object.]]>
  18452. </doc>
  18453. </method>
  18454. <field name="TYPE_SEPARATOR" type="java.lang.String"
  18455. transient="false" volatile="false"
  18456. static="true" final="true" visibility="public"
  18457. deprecated="not deprecated">
  18458. </field>
  18459. <field name="ONE" type="org.apache.hadoop.io.Text"
  18460. transient="false" volatile="false"
  18461. static="true" final="true" visibility="public"
  18462. deprecated="not deprecated">
  18463. </field>
  18464. <doc>
  18465. <![CDATA[This interface defines the contract a value aggregator descriptor must
  18466. support. Such a descriptor can be configured with a {@link Configuration}
  18467. object. Its main function is to generate a list of aggregation-id/value
  18468. pairs. An aggregation id encodes an aggregation type which is used to
  18469. guide the way to aggregate the value in the reduce/combiner phase of an
  18470. Aggregate based job.
  18471. The mapper in an Aggregate based map/reduce job may create one or more of
  18472. ValueAggregatorDescriptor objects at configuration time. For each input
  18473. key/value pair, the mapper will use those objects to create aggregation
  18474. id/value pairs.]]>
  18475. </doc>
  18476. </interface>
  18477. <!-- end interface org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor -->
  18478. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJob -->
  18479. <class name="ValueAggregatorJob" extends="java.lang.Object"
  18480. abstract="false"
  18481. static="false" final="false" visibility="public"
  18482. deprecated="not deprecated">
  18483. <constructor name="ValueAggregatorJob"
  18484. static="false" final="false" visibility="public"
  18485. deprecated="not deprecated">
  18486. </constructor>
  18487. <method name="createValueAggregatorJobs" return="org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl"
  18488. abstract="false" native="false" synchronized="false"
  18489. static="true" final="false" visibility="public"
  18490. deprecated="not deprecated">
  18491. <param name="args" type="java.lang.String[]"/>
  18492. <param name="descriptors" type="java.lang.Class[]"/>
  18493. <exception name="IOException" type="java.io.IOException"/>
  18494. </method>
  18495. <method name="createValueAggregatorJobs" return="org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl"
  18496. abstract="false" native="false" synchronized="false"
  18497. static="true" final="false" visibility="public"
  18498. deprecated="not deprecated">
  18499. <param name="args" type="java.lang.String[]"/>
  18500. <exception name="IOException" type="java.io.IOException"/>
  18501. </method>
  18502. <method name="createValueAggregatorJob" return="org.apache.hadoop.mapreduce.Job"
  18503. abstract="false" native="false" synchronized="false"
  18504. static="true" final="false" visibility="public"
  18505. deprecated="not deprecated">
  18506. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  18507. <param name="args" type="java.lang.String[]"/>
  18508. <exception name="IOException" type="java.io.IOException"/>
  18509. <doc>
  18510. <![CDATA[Create an Aggregate based map/reduce job.
  18511. @param conf The configuration for job
  18512. @param args the arguments used for job creation. Generic hadoop
  18513. arguments are accepted.
  18514. @return a Job object ready for submission.
  18515. @throws IOException
  18516. @see GenericOptionsParser]]>
  18517. </doc>
  18518. </method>
  18519. <method name="createValueAggregatorJob" return="org.apache.hadoop.mapreduce.Job"
  18520. abstract="false" native="false" synchronized="false"
  18521. static="true" final="false" visibility="public"
  18522. deprecated="not deprecated">
  18523. <param name="args" type="java.lang.String[]"/>
  18524. <param name="descriptors" type="java.lang.Class[]"/>
  18525. <exception name="IOException" type="java.io.IOException"/>
  18526. </method>
  18527. <method name="setAggregatorDescriptors" return="org.apache.hadoop.conf.Configuration"
  18528. abstract="false" native="false" synchronized="false"
  18529. static="true" final="false" visibility="public"
  18530. deprecated="not deprecated">
  18531. <param name="descriptors" type="java.lang.Class[]"/>
  18532. </method>
  18533. <method name="main"
  18534. abstract="false" native="false" synchronized="false"
  18535. static="true" final="false" visibility="public"
  18536. deprecated="not deprecated">
  18537. <param name="args" type="java.lang.String[]"/>
  18538. <exception name="IOException" type="java.io.IOException"/>
  18539. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18540. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  18541. <doc>
  18542. <![CDATA[create and run an Aggregate based map/reduce job.
  18543. @param args the arguments used for job creation
  18544. @throws IOException]]>
  18545. </doc>
  18546. </method>
  18547. <doc>
  18548. <![CDATA[This is the main class for creating a map/reduce job using Aggregate
  18549. framework. The Aggregate is a specialization of map/reduce framework,
  18550. specializing for performing various simple aggregations.
  18551. Generally speaking, in order to implement an application using Map/Reduce
  18552. model, the developer is to implement Map and Reduce functions (and possibly
  18553. combine function). However, a lot of applications related to counting and
  18554. statistics computing have very similar characteristics. Aggregate abstracts
  18555. out the general patterns of these functions and implements those patterns.
  18556. In particular, the package provides generic mapper/reducer/combiner
  18557. classes, and a set of built-in value aggregators, and a generic utility
  18558. class that helps user create map/reduce jobs using the generic class.
  18559. The built-in aggregators include:
  18560. sum over numeric values; count the number of distinct values; compute the
  18561. histogram of values; compute the minimum, maximum, median, average, and standard
  18562. deviation of numeric values.
  18563. The developer using Aggregate will need only to provide a plugin class
  18564. conforming to the following interface:
  18565. public interface ValueAggregatorDescriptor { public ArrayList<Entry>
  18566. generateKeyValPairs(Object key, Object value); public void
  18567. configure(Configuration conf); }
  18568. The package also provides a base class, ValueAggregatorBaseDescriptor,
  18569. implementing the above interface. The user can extend the base class and
  18570. implement generateKeyValPairs accordingly.
  18571. The primary work of generateKeyValPairs is to emit one or more key/value
  18572. pairs based on the input key/value pair. The key in an output key/value pair
  18573. encodes two pieces of information: aggregation type and aggregation id. The
  18574. value will be aggregated onto the aggregation id according to the aggregation
  18575. type.
  18576. This class offers a function to generate a map/reduce job using Aggregate
  18577. framework. The function takes the following parameters: input directory spec;
  18578. input format (text or sequence file); output directory; a file specifying the
  18579. user plugin class.]]>
  18580. </doc>
  18581. </class>
  18582. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJob -->
  18583. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJobBase -->
  18584. <class name="ValueAggregatorJobBase" extends="java.lang.Object"
  18585. abstract="false"
  18586. static="false" final="false" visibility="public"
  18587. deprecated="not deprecated">
  18588. <constructor name="ValueAggregatorJobBase"
  18589. static="false" final="false" visibility="public"
  18590. deprecated="not deprecated">
  18591. </constructor>
  18592. <method name="setup"
  18593. abstract="false" native="false" synchronized="false"
  18594. static="true" final="false" visibility="public"
  18595. deprecated="not deprecated">
  18596. <param name="job" type="org.apache.hadoop.conf.Configuration"/>
  18597. </method>
  18598. <method name="getValueAggregatorDescriptor" return="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorDescriptor"
  18599. abstract="false" native="false" synchronized="false"
  18600. static="true" final="false" visibility="protected"
  18601. deprecated="not deprecated">
  18602. <param name="spec" type="java.lang.String"/>
  18603. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  18604. </method>
  18605. <method name="getAggregatorDescriptors" return="java.util.ArrayList"
  18606. abstract="false" native="false" synchronized="false"
  18607. static="true" final="false" visibility="protected"
  18608. deprecated="not deprecated">
  18609. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  18610. </method>
  18611. <method name="logSpec"
  18612. abstract="false" native="false" synchronized="false"
  18613. static="true" final="false" visibility="protected"
  18614. deprecated="not deprecated">
  18615. </method>
  18616. <field name="DESCRIPTOR" type="java.lang.String"
  18617. transient="false" volatile="false"
  18618. static="true" final="true" visibility="public"
  18619. deprecated="not deprecated">
  18620. </field>
  18621. <field name="DESCRIPTOR_NUM" type="java.lang.String"
  18622. transient="false" volatile="false"
  18623. static="true" final="true" visibility="public"
  18624. deprecated="not deprecated">
  18625. </field>
  18626. <field name="USER_JAR" type="java.lang.String"
  18627. transient="false" volatile="false"
  18628. static="true" final="true" visibility="public"
  18629. deprecated="not deprecated">
  18630. </field>
  18631. <field name="aggregatorDescriptorList" type="java.util.ArrayList"
  18632. transient="false" volatile="false"
  18633. static="true" final="false" visibility="protected"
  18634. deprecated="not deprecated">
  18635. </field>
  18636. <doc>
  18637. <![CDATA[This abstract class implements some common functionalities of
  18638. the generic mapper, reducer and combiner classes of Aggregate.]]>
  18639. </doc>
  18640. </class>
  18641. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorJobBase -->
  18642. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorMapper -->
  18643. <class name="ValueAggregatorMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  18644. abstract="false"
  18645. static="false" final="false" visibility="public"
  18646. deprecated="not deprecated">
  18647. <constructor name="ValueAggregatorMapper"
  18648. static="false" final="false" visibility="public"
  18649. deprecated="not deprecated">
  18650. </constructor>
  18651. <method name="setup"
  18652. abstract="false" native="false" synchronized="false"
  18653. static="false" final="false" visibility="public"
  18654. deprecated="not deprecated">
  18655. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  18656. <exception name="IOException" type="java.io.IOException"/>
  18657. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18658. </method>
  18659. <method name="map"
  18660. abstract="false" native="false" synchronized="false"
  18661. static="false" final="false" visibility="public"
  18662. deprecated="not deprecated">
  18663. <param name="key" type="K1"/>
  18664. <param name="value" type="V1"/>
  18665. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  18666. <exception name="IOException" type="java.io.IOException"/>
  18667. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18668. <doc>
  18669. <![CDATA[the map function. It iterates through the value aggregator descriptor
  18670. list to generate aggregation id/value pairs and emit them.]]>
  18671. </doc>
  18672. </method>
  18673. <doc>
  18674. <![CDATA[This class implements the generic mapper of Aggregate.]]>
  18675. </doc>
  18676. </class>
  18677. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorMapper -->
  18678. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorReducer -->
  18679. <class name="ValueAggregatorReducer" extends="org.apache.hadoop.mapreduce.Reducer"
  18680. abstract="false"
  18681. static="false" final="false" visibility="public"
  18682. deprecated="not deprecated">
  18683. <constructor name="ValueAggregatorReducer"
  18684. static="false" final="false" visibility="public"
  18685. deprecated="not deprecated">
  18686. </constructor>
  18687. <method name="setup"
  18688. abstract="false" native="false" synchronized="false"
  18689. static="false" final="false" visibility="public"
  18690. deprecated="not deprecated">
  18691. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  18692. <exception name="IOException" type="java.io.IOException"/>
  18693. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18694. </method>
  18695. <method name="reduce"
  18696. abstract="false" native="false" synchronized="false"
  18697. static="false" final="false" visibility="public"
  18698. deprecated="not deprecated">
  18699. <param name="key" type="org.apache.hadoop.io.Text"/>
  18700. <param name="values" type="java.lang.Iterable"/>
  18701. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  18702. <exception name="IOException" type="java.io.IOException"/>
  18703. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18704. <doc>
  18705. <![CDATA[@param key
  18706. the key is expected to be a Text object, whose prefix indicates
  18707. the type of aggregation to aggregate the values. In effect, data
  18708. driven computing is achieved. It is assumed that each aggregator's
  18709. getReport method emits appropriate output for the aggregator. This
  18710. may be further customized.
  18711. @param values the values to be aggregated
  18712. @param context]]>
  18713. </doc>
  18714. </method>
  18715. <doc>
  18716. <![CDATA[This class implements the generic reducer of Aggregate.]]>
  18717. </doc>
  18718. </class>
  18719. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregatorReducer -->
  18720. <!-- start class org.apache.hadoop.mapreduce.lib.aggregate.ValueHistogram -->
  18721. <class name="ValueHistogram" extends="java.lang.Object"
  18722. abstract="false"
  18723. static="false" final="false" visibility="public"
  18724. deprecated="not deprecated">
  18725. <implements name="org.apache.hadoop.mapreduce.lib.aggregate.ValueAggregator"/>
  18726. <constructor name="ValueHistogram"
  18727. static="false" final="false" visibility="public"
  18728. deprecated="not deprecated">
  18729. </constructor>
  18730. <method name="addNextValue"
  18731. abstract="false" native="false" synchronized="false"
  18732. static="false" final="false" visibility="public"
  18733. deprecated="not deprecated">
  18734. <param name="val" type="java.lang.Object"/>
  18735. <doc>
  18736. <![CDATA[add the given val to the aggregator.
  18737. @param val the value to be added. It is expected to be a string
  18738. in the form of xxxx\tnum, meaning xxxx has num occurrences.]]>
  18739. </doc>
  18740. </method>
  18741. <method name="getReport" return="java.lang.String"
  18742. abstract="false" native="false" synchronized="false"
  18743. static="false" final="false" visibility="public"
  18744. deprecated="not deprecated">
  18745. <doc>
  18746. <![CDATA[@return the string representation of this aggregator.
  18747. It includes the following basic statistics of the histogram:
  18748. the number of unique values
  18749. the minimum value
  18750. the median value
  18751. the maximum value
  18752. the average value
  18753. the standard deviation]]>
  18754. </doc>
  18755. </method>
  18756. <method name="getReportDetails" return="java.lang.String"
  18757. abstract="false" native="false" synchronized="false"
  18758. static="false" final="false" visibility="public"
  18759. deprecated="not deprecated">
  18760. <doc>
  18761. <![CDATA[@return a string representation of the list of value/frequency pairs of
  18762. the histogram]]>
  18763. </doc>
  18764. </method>
  18765. <method name="getCombinerOutput" return="java.util.ArrayList"
  18766. abstract="false" native="false" synchronized="false"
  18767. static="false" final="false" visibility="public"
  18768. deprecated="not deprecated">
  18769. <doc>
  18770. <![CDATA[@return a list of value/frequency pairs.
  18771. The return value is expected to be used by the reducer.]]>
  18772. </doc>
  18773. </method>
  18774. <method name="getReportItems" return="java.util.TreeMap"
  18775. abstract="false" native="false" synchronized="false"
  18776. static="false" final="false" visibility="public"
  18777. deprecated="not deprecated">
  18778. <doc>
  18779. <![CDATA[@return a TreeMap representation of the histogram]]>
  18780. </doc>
  18781. </method>
  18782. <method name="reset"
  18783. abstract="false" native="false" synchronized="false"
  18784. static="false" final="false" visibility="public"
  18785. deprecated="not deprecated">
  18786. <doc>
  18787. <![CDATA[reset the aggregator]]>
  18788. </doc>
  18789. </method>
  18790. <doc>
  18791. <![CDATA[This class implements a value aggregator that computes the
  18792. histogram of a sequence of strings.]]>
  18793. </doc>
  18794. </class>
  18795. <!-- end class org.apache.hadoop.mapreduce.lib.aggregate.ValueHistogram -->
  18796. </package>
  18797. <package name="org.apache.hadoop.mapreduce.lib.chain">
  18798. <!-- start class org.apache.hadoop.mapreduce.lib.chain.ChainMapper -->
  18799. <class name="ChainMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  18800. abstract="false"
  18801. static="false" final="false" visibility="public"
  18802. deprecated="not deprecated">
  18803. <constructor name="ChainMapper"
  18804. static="false" final="false" visibility="public"
  18805. deprecated="not deprecated">
  18806. </constructor>
  18807. <method name="addMapper"
  18808. abstract="false" native="false" synchronized="false"
  18809. static="true" final="false" visibility="public"
  18810. deprecated="not deprecated">
  18811. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  18812. <param name="klass" type="java.lang.Class"/>
  18813. <param name="inputKeyClass" type="java.lang.Class"/>
  18814. <param name="inputValueClass" type="java.lang.Class"/>
  18815. <param name="outputKeyClass" type="java.lang.Class"/>
  18816. <param name="outputValueClass" type="java.lang.Class"/>
  18817. <param name="mapperConf" type="org.apache.hadoop.conf.Configuration"/>
  18818. <exception name="IOException" type="java.io.IOException"/>
  18819. <doc>
  18820. <![CDATA[Adds a {@link Mapper} class to the chain mapper.
  18821. <p>
  18822. The key and values are passed from one element of the chain to the next, by
  18823. value. For the added Mapper the configuration given for it,
  18824. <code>mapperConf</code>, has precedence over the job's Configuration. This
  18825. precedence is in effect when the task is running.
  18826. </p>
  18827. <p>
  18828. IMPORTANT: There is no need to specify the output key/value classes for the
  18829. ChainMapper; this is done by the addMapper for the last mapper in the chain.
  18830. </p>
  18831. @param job
  18832. The job.
  18833. @param klass
  18834. the Mapper class to add.
  18835. @param inputKeyClass
  18836. mapper input key class.
  18837. @param inputValueClass
  18838. mapper input value class.
  18839. @param outputKeyClass
  18840. mapper output key class.
  18841. @param outputValueClass
  18842. mapper output value class.
  18843. @param mapperConf
  18844. a configuration for the Mapper class. It is recommended to use a
  18845. Configuration without default values using the
  18846. <code>Configuration(boolean loadDefaults)</code> constructor with
  18847. FALSE.]]>
  18848. </doc>
  18849. </method>
  18850. <method name="setup"
  18851. abstract="false" native="false" synchronized="false"
  18852. static="false" final="false" visibility="protected"
  18853. deprecated="not deprecated">
  18854. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  18855. </method>
  18856. <method name="run"
  18857. abstract="false" native="false" synchronized="false"
  18858. static="false" final="false" visibility="public"
  18859. deprecated="not deprecated">
  18860. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  18861. <exception name="IOException" type="java.io.IOException"/>
  18862. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  18863. </method>
  18864. <doc>
  18865. <![CDATA[The ChainMapper class allows the use of multiple Mapper classes within a single
  18866. Map task.
  18867. <p>
  18868. The Mapper classes are invoked in a chained (or piped) fashion, the output of
  18869. the first becomes the input of the second, and so on until the last Mapper,
  18870. the output of the last Mapper will be written to the task's output.
  18871. </p>
  18872. <p>
  18873. The key functionality of this feature is that the Mappers in the chain do not
  18874. need to be aware that they are executed in a chain. This enables having
  18875. reusable specialized Mappers that can be combined to perform composite
  18876. operations within a single task.
  18877. </p>
  18878. <p>
  18879. Special care has to be taken when creating chains that the key/values output
  18880. by a Mapper are valid for the following Mapper in the chain. It is assumed
  18881. all Mappers and the Reduce in the chain use matching output and input key and
  18882. value classes as no conversion is done by the chaining code.
  18883. </p>
  18884. <p>
  18885. Using the ChainMapper and the ChainReducer classes, it is possible to compose
  18886. Map/Reduce jobs that look like <code>[MAP+ / REDUCE MAP*]</code>. An
  18887. immediate benefit of this pattern is a dramatic reduction in disk IO.
  18888. </p>
  18889. <p>
  18890. IMPORTANT: There is no need to specify the output key/value classes for the
  18891. ChainMapper, this is done by the addMapper for the last mapper in the chain.
  18892. </p>
  18893. ChainMapper usage pattern:
  18894. <p/>
  18895. <pre>
  18896. ...
  18897. Job job = new Job(conf);
  18898. <p/>
  18899. Configuration mapAConf = new Configuration(false);
  18900. ...
  18901. ChainMapper.addMapper(job, AMap.class, LongWritable.class, Text.class,
  18902. Text.class, Text.class, mapAConf);
  18903. <p/>
  18904. Configuration mapBConf = new Configuration(false);
  18905. ...
  18906. ChainMapper.addMapper(job, BMap.class, Text.class, Text.class,
  18907. LongWritable.class, Text.class, mapBConf);
  18908. <p/>
  18909. ...
  18910. <p/>
  18911. job.waitForCompletion(true);
  18912. ...
  18913. </pre>]]>
  18914. </doc>
  18915. </class>
  18916. <!-- end class org.apache.hadoop.mapreduce.lib.chain.ChainMapper -->
  18917. <!-- start class org.apache.hadoop.mapreduce.lib.chain.ChainReducer -->
  18918. <class name="ChainReducer" extends="org.apache.hadoop.mapreduce.Reducer"
  18919. abstract="false"
  18920. static="false" final="false" visibility="public"
  18921. deprecated="not deprecated">
  18922. <constructor name="ChainReducer"
  18923. static="false" final="false" visibility="public"
  18924. deprecated="not deprecated">
  18925. </constructor>
  18926. <method name="setReducer"
  18927. abstract="false" native="false" synchronized="false"
  18928. static="true" final="false" visibility="public"
  18929. deprecated="not deprecated">
  18930. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  18931. <param name="klass" type="java.lang.Class"/>
  18932. <param name="inputKeyClass" type="java.lang.Class"/>
  18933. <param name="inputValueClass" type="java.lang.Class"/>
  18934. <param name="outputKeyClass" type="java.lang.Class"/>
  18935. <param name="outputValueClass" type="java.lang.Class"/>
  18936. <param name="reducerConf" type="org.apache.hadoop.conf.Configuration"/>
  18937. <doc>
  18938. <![CDATA[Sets the {@link Reducer} class to the chain job.
  18939. <p>
  18940. The key and values are passed from one element of the chain to the next, by
  18941. value. For the added Reducer the configuration given for it,
  18942. <code>reducerConf</code>, has precedence over the job's Configuration.
  18943. This precedence is in effect when the task is running.
  18944. </p>
  18945. <p>
  18946. IMPORTANT: There is no need to specify the output key/value classes for the
  18947. ChainReducer, this is done by the setReducer or the addMapper for the last
  18948. element in the chain.
  18949. </p>
  18950. @param job
  18951. the job
  18952. @param klass
  18953. the Reducer class to add.
  18954. @param inputKeyClass
  18955. reducer input key class.
  18956. @param inputValueClass
  18957. reducer input value class.
  18958. @param outputKeyClass
  18959. reducer output key class.
  18960. @param outputValueClass
  18961. reducer output value class.
  18962. @param reducerConf
  18963. a configuration for the Reducer class. It is recommended to use a
  18964. Configuration without default values using the
  18965. <code>Configuration(boolean loadDefaults)</code> constructor with
  18966. FALSE.]]>
  18967. </doc>
  18968. </method>
  18969. <method name="addMapper"
  18970. abstract="false" native="false" synchronized="false"
  18971. static="true" final="false" visibility="public"
  18972. deprecated="not deprecated">
  18973. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  18974. <param name="klass" type="java.lang.Class"/>
  18975. <param name="inputKeyClass" type="java.lang.Class"/>
  18976. <param name="inputValueClass" type="java.lang.Class"/>
  18977. <param name="outputKeyClass" type="java.lang.Class"/>
  18978. <param name="outputValueClass" type="java.lang.Class"/>
  18979. <param name="mapperConf" type="org.apache.hadoop.conf.Configuration"/>
  18980. <exception name="IOException" type="java.io.IOException"/>
  18981. <doc>
  18982. <![CDATA[Adds a {@link Mapper} class to the chain reducer.
  18983. <p>
  18984. The key and values are passed from one element of the chain to the next, by
  18985. value. For the added Mapper the configuration given for it,
  18986. <code>mapperConf</code>, has precedence over the job's Configuration. This
  18987. precedence is in effect when the task is running.
  18988. </p>
  18989. <p>
  18990. IMPORTANT: There is no need to specify the output key/value classes for the
  18991. ChainMapper, this is done by the addMapper for the last mapper in the
  18992. chain.
  18993. </p>
  18994. @param job
  18995. The job.
  18996. @param klass
  18997. the Mapper class to add.
  18998. @param inputKeyClass
  18999. mapper input key class.
  19000. @param inputValueClass
  19001. mapper input value class.
  19002. @param outputKeyClass
  19003. mapper output key class.
  19004. @param outputValueClass
  19005. mapper output value class.
  19006. @param mapperConf
  19007. a configuration for the Mapper class. It is recommended to use a
  19008. Configuration without default values using the
  19009. <code>Configuration(boolean loadDefaults)</code> constructor with
  19010. FALSE.]]>
  19011. </doc>
  19012. </method>
  19013. <method name="setup"
  19014. abstract="false" native="false" synchronized="false"
  19015. static="false" final="false" visibility="protected"
  19016. deprecated="not deprecated">
  19017. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  19018. </method>
  19019. <method name="run"
  19020. abstract="false" native="false" synchronized="false"
  19021. static="false" final="false" visibility="public"
  19022. deprecated="not deprecated">
  19023. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  19024. <exception name="IOException" type="java.io.IOException"/>
  19025. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  19026. </method>
  19027. <doc>
  19028. <![CDATA[The ChainReducer class allows chaining multiple Mapper classes after a
  19029. Reducer within the Reducer task.
  19030. <p>
  19031. For each record output by the Reducer, the Mapper classes are invoked in a
  19032. chained (or piped) fashion. The output of the reducer becomes the input of
  19033. the first mapper and output of first becomes the input of the second, and so
  19034. on until the last Mapper, the output of the last Mapper will be written to
  19035. the task's output.
  19036. </p>
  19037. <p>
  19038. The key functionality of this feature is that the Mappers in the chain do not
  19039. need to be aware that they are executed after the Reducer or in a chain. This
  19040. enables having reusable specialized Mappers that can be combined to perform
  19041. composite operations within a single task.
  19042. </p>
  19043. <p>
  19044. Special care has to be taken when creating chains that the key/values output
  19045. by a Mapper are valid for the following Mapper in the chain. It is assumed
  19046. all Mappers and the Reduce in the chain use matching output and input key and
  19047. value classes as no conversion is done by the chaining code.
  19048. </p>
  19049. <p> Using the ChainMapper and the ChainReducer classes, it is possible to
  19050. compose Map/Reduce jobs that look like <code>[MAP+ / REDUCE MAP*]</code>. An
  19051. immediate benefit of this pattern is a dramatic reduction in disk IO. </p>
  19052. <p>
  19053. IMPORTANT: There is no need to specify the output key/value classes for the
  19054. ChainReducer, this is done by the setReducer or the addMapper for the last
  19055. element in the chain.
  19056. </p>
  19057. ChainReducer usage pattern:
  19058. <p/>
  19059. <pre>
  19060. ...
  19061. Job job = new Job(conf);
  19062. ....
  19063. <p/>
  19064. Configuration reduceConf = new Configuration(false);
  19065. ...
  19066. ChainReducer.setReducer(job, XReduce.class, LongWritable.class, Text.class,
  19067. Text.class, Text.class, reduceConf);
  19068. <p/>
  19069. ChainReducer.addMapper(job, CMap.class, Text.class, Text.class,
  19070. LongWritable.class, Text.class, null);
  19071. <p/>
  19072. ChainReducer.addMapper(job, DMap.class, LongWritable.class, Text.class,
  19073. LongWritable.class, LongWritable.class, null);
  19074. <p/>
  19075. ...
  19076. <p/>
  19077. job.waitForCompletion(true);
  19078. ...
  19079. </pre>]]>
  19080. </doc>
  19081. </class>
  19082. <!-- end class org.apache.hadoop.mapreduce.lib.chain.ChainReducer -->
  19083. </package>
  19084. <package name="org.apache.hadoop.mapreduce.lib.db">
  19085. <!-- start class org.apache.hadoop.mapreduce.lib.db.BigDecimalSplitter -->
  19086. <class name="BigDecimalSplitter" extends="java.lang.Object"
  19087. abstract="false"
  19088. static="false" final="false" visibility="public"
  19089. deprecated="not deprecated">
  19090. <implements name="org.apache.hadoop.mapreduce.lib.db.DBSplitter"/>
  19091. <constructor name="BigDecimalSplitter"
  19092. static="false" final="false" visibility="public"
  19093. deprecated="not deprecated">
  19094. </constructor>
  19095. <method name="split" return="java.util.List"
  19096. abstract="false" native="false" synchronized="false"
  19097. static="false" final="false" visibility="public"
  19098. deprecated="not deprecated">
  19099. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19100. <param name="results" type="java.sql.ResultSet"/>
  19101. <param name="colName" type="java.lang.String"/>
  19102. <exception name="SQLException" type="java.sql.SQLException"/>
  19103. </method>
  19104. <method name="tryDivide" return="java.math.BigDecimal"
  19105. abstract="false" native="false" synchronized="false"
  19106. static="false" final="false" visibility="protected"
  19107. deprecated="not deprecated">
  19108. <param name="numerator" type="java.math.BigDecimal"/>
  19109. <param name="denominator" type="java.math.BigDecimal"/>
  19110. <doc>
  19111. <![CDATA[Divide numerator by denominator. If impossible in exact mode, use rounding.]]>
  19112. </doc>
  19113. </method>
  19114. <doc>
  19115. <![CDATA[Implement DBSplitter over BigDecimal values.]]>
  19116. </doc>
  19117. </class>
  19118. <!-- end class org.apache.hadoop.mapreduce.lib.db.BigDecimalSplitter -->
  19119. <!-- start class org.apache.hadoop.mapreduce.lib.db.BooleanSplitter -->
  19120. <class name="BooleanSplitter" extends="java.lang.Object"
  19121. abstract="false"
  19122. static="false" final="false" visibility="public"
  19123. deprecated="not deprecated">
  19124. <implements name="org.apache.hadoop.mapreduce.lib.db.DBSplitter"/>
  19125. <constructor name="BooleanSplitter"
  19126. static="false" final="false" visibility="public"
  19127. deprecated="not deprecated">
  19128. </constructor>
  19129. <method name="split" return="java.util.List"
  19130. abstract="false" native="false" synchronized="false"
  19131. static="false" final="false" visibility="public"
  19132. deprecated="not deprecated">
  19133. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19134. <param name="results" type="java.sql.ResultSet"/>
  19135. <param name="colName" type="java.lang.String"/>
  19136. <exception name="SQLException" type="java.sql.SQLException"/>
  19137. </method>
  19138. <doc>
  19139. <![CDATA[Implement DBSplitter over boolean values.]]>
  19140. </doc>
  19141. </class>
  19142. <!-- end class org.apache.hadoop.mapreduce.lib.db.BooleanSplitter -->
  19143. <!-- start class org.apache.hadoop.mapreduce.lib.db.DataDrivenDBInputFormat -->
  19144. <class name="DataDrivenDBInputFormat" extends="org.apache.hadoop.mapreduce.lib.db.DBInputFormat"
  19145. abstract="false"
  19146. static="false" final="false" visibility="public"
  19147. deprecated="not deprecated">
  19148. <implements name="org.apache.hadoop.conf.Configurable"/>
  19149. <constructor name="DataDrivenDBInputFormat"
  19150. static="false" final="false" visibility="public"
  19151. deprecated="not deprecated">
  19152. </constructor>
  19153. <method name="getSplitter" return="org.apache.hadoop.mapreduce.lib.db.DBSplitter"
  19154. abstract="false" native="false" synchronized="false"
  19155. static="false" final="false" visibility="protected"
  19156. deprecated="not deprecated">
  19157. <param name="sqlDataType" type="int"/>
  19158. <doc>
  19159. <![CDATA[@return the DBSplitter implementation to use to divide the table/query into InputSplits.]]>
  19160. </doc>
  19161. </method>
  19162. <method name="getSplits" return="java.util.List"
  19163. abstract="false" native="false" synchronized="false"
  19164. static="false" final="false" visibility="public"
  19165. deprecated="not deprecated">
  19166. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  19167. <exception name="IOException" type="java.io.IOException"/>
  19168. <doc>
  19169. <![CDATA[{@inheritDoc}]]>
  19170. </doc>
  19171. </method>
  19172. <method name="getBoundingValsQuery" return="java.lang.String"
  19173. abstract="false" native="false" synchronized="false"
  19174. static="false" final="false" visibility="protected"
  19175. deprecated="not deprecated">
  19176. <doc>
  19177. <![CDATA[@return a query which returns the minimum and maximum values for
  19178. the order-by column.
  19179. The min value should be in the first column, and the
  19180. max value should be in the second column of the results.]]>
  19181. </doc>
  19182. </method>
  19183. <method name="setBoundingQuery"
  19184. abstract="false" native="false" synchronized="false"
  19185. static="true" final="false" visibility="public"
  19186. deprecated="not deprecated">
  19187. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19188. <param name="query" type="java.lang.String"/>
  19189. <doc>
  19190. <![CDATA[Set the user-defined bounding query to use with a user-defined query.
  19191. This *must* include the substring "$CONDITIONS"
  19192. (DataDrivenDBInputFormat.SUBSTITUTE_TOKEN) inside the WHERE clause,
  19193. so that DataDrivenDBInputFormat knows where to insert split clauses.
  19194. e.g., "SELECT foo FROM mytable WHERE $CONDITIONS"
  19195. This will be expanded to something like:
  19196. SELECT foo FROM mytable WHERE (id &gt; 100) AND (id &lt; 250)
  19197. inside each split.]]>
  19198. </doc>
  19199. </method>
  19200. <method name="createDBRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  19201. abstract="false" native="false" synchronized="false"
  19202. static="false" final="false" visibility="protected"
  19203. deprecated="not deprecated">
  19204. <param name="split" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit"/>
  19205. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19206. <exception name="IOException" type="java.io.IOException"/>
  19207. </method>
  19208. <method name="setInput"
  19209. abstract="false" native="false" synchronized="false"
  19210. static="true" final="false" visibility="public"
  19211. deprecated="not deprecated">
  19212. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  19213. <param name="inputClass" type="java.lang.Class"/>
  19214. <param name="tableName" type="java.lang.String"/>
  19215. <param name="conditions" type="java.lang.String"/>
  19216. <param name="splitBy" type="java.lang.String"/>
  19217. <param name="fieldNames" type="java.lang.String[]"/>
  19218. <doc>
  19219. <![CDATA[Note that the "orderBy" column is called the "splitBy" in this version.
  19220. We reuse the same field, but it's not strictly ordering it -- just partitioning
  19221. the results.]]>
  19222. </doc>
  19223. </method>
  19224. <method name="setInput"
  19225. abstract="false" native="false" synchronized="false"
  19226. static="true" final="false" visibility="public"
  19227. deprecated="not deprecated">
  19228. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  19229. <param name="inputClass" type="java.lang.Class"/>
  19230. <param name="inputQuery" type="java.lang.String"/>
  19231. <param name="inputBoundingQuery" type="java.lang.String"/>
  19232. <doc>
  19233. <![CDATA[setInput() takes a custom query and a separate "bounding query" to use
  19234. instead of the custom "count query" used by DBInputFormat.]]>
  19235. </doc>
  19236. </method>
  19237. <field name="SUBSTITUTE_TOKEN" type="java.lang.String"
  19238. transient="false" volatile="false"
  19239. static="true" final="true" visibility="public"
  19240. deprecated="not deprecated">
  19241. <doc>
  19242. <![CDATA[If users are providing their own query, the following string is expected to
  19243. appear in the WHERE clause, which will be substituted with a pair of conditions
  19244. on the input to allow input splits to parallelise the import.]]>
  19245. </doc>
  19246. </field>
  19247. <doc>
  19248. <![CDATA[An InputFormat that reads input data from an SQL table.
  19249. Operates like DBInputFormat, but instead of using LIMIT and OFFSET to demarcate
  19250. splits, it tries to generate WHERE clauses which separate the data into roughly
  19251. equivalent shards.]]>
  19252. </doc>
  19253. </class>
  19254. <!-- end class org.apache.hadoop.mapreduce.lib.db.DataDrivenDBInputFormat -->
  19255. <!-- start class org.apache.hadoop.mapreduce.lib.db.DataDrivenDBInputFormat.DataDrivenDBInputSplit -->
  19256. <class name="DataDrivenDBInputFormat.DataDrivenDBInputSplit" extends="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit"
  19257. abstract="false"
  19258. static="true" final="false" visibility="public"
  19259. deprecated="not deprecated">
  19260. <constructor name="DataDrivenDBInputFormat.DataDrivenDBInputSplit"
  19261. static="false" final="false" visibility="public"
  19262. deprecated="not deprecated">
  19263. <doc>
  19264. <![CDATA[Default Constructor]]>
  19265. </doc>
  19266. </constructor>
  19267. <constructor name="DataDrivenDBInputFormat.DataDrivenDBInputSplit" type="java.lang.String, java.lang.String"
  19268. static="false" final="false" visibility="public"
  19269. deprecated="not deprecated">
  19270. <doc>
  19271. <![CDATA[Convenience Constructor
  19272. @param lower the string to be put in the WHERE clause to guard on the 'lower' end
  19273. @param upper the string to be put in the WHERE clause to guard on the 'upper' end]]>
  19274. </doc>
  19275. </constructor>
  19276. <method name="getLength" return="long"
  19277. abstract="false" native="false" synchronized="false"
  19278. static="false" final="false" visibility="public"
  19279. deprecated="not deprecated">
  19280. <exception name="IOException" type="java.io.IOException"/>
  19281. <doc>
  19282. <![CDATA[@return The total row count in this split]]>
  19283. </doc>
  19284. </method>
  19285. <method name="readFields"
  19286. abstract="false" native="false" synchronized="false"
  19287. static="false" final="false" visibility="public"
  19288. deprecated="not deprecated">
  19289. <param name="input" type="java.io.DataInput"/>
  19290. <exception name="IOException" type="java.io.IOException"/>
  19291. <doc>
  19292. <![CDATA[{@inheritDoc}]]>
  19293. </doc>
  19294. </method>
  19295. <method name="write"
  19296. abstract="false" native="false" synchronized="false"
  19297. static="false" final="false" visibility="public"
  19298. deprecated="not deprecated">
  19299. <param name="output" type="java.io.DataOutput"/>
  19300. <exception name="IOException" type="java.io.IOException"/>
  19301. <doc>
  19302. <![CDATA[{@inheritDoc}]]>
  19303. </doc>
  19304. </method>
  19305. <method name="getLowerClause" return="java.lang.String"
  19306. abstract="false" native="false" synchronized="false"
  19307. static="false" final="false" visibility="public"
  19308. deprecated="not deprecated">
  19309. </method>
  19310. <method name="getUpperClause" return="java.lang.String"
  19311. abstract="false" native="false" synchronized="false"
  19312. static="false" final="false" visibility="public"
  19313. deprecated="not deprecated">
  19314. </method>
  19315. <doc>
  19316. <![CDATA[An InputSplit that spans a set of rows]]>
  19317. </doc>
  19318. </class>
  19319. <!-- end class org.apache.hadoop.mapreduce.lib.db.DataDrivenDBInputFormat.DataDrivenDBInputSplit -->
  19320. <!-- start class org.apache.hadoop.mapreduce.lib.db.DataDrivenDBRecordReader -->
  19321. <class name="DataDrivenDBRecordReader" extends="org.apache.hadoop.mapreduce.lib.db.DBRecordReader"
  19322. abstract="false"
  19323. static="false" final="false" visibility="public"
  19324. deprecated="not deprecated">
  19325. <constructor name="DataDrivenDBRecordReader" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.conf.Configuration, java.sql.Connection, org.apache.hadoop.mapreduce.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String, java.lang.String"
  19326. static="false" final="false" visibility="public"
  19327. deprecated="not deprecated">
  19328. <exception name="SQLException" type="java.sql.SQLException"/>
  19329. <doc>
  19330. <![CDATA[@param split The InputSplit to read data for
  19331. @throws SQLException]]>
  19332. </doc>
  19333. </constructor>
  19334. <method name="getSelectQuery" return="java.lang.String"
  19335. abstract="false" native="false" synchronized="false"
  19336. static="false" final="false" visibility="protected"
  19337. deprecated="not deprecated">
  19338. <doc>
  19339. <![CDATA[Returns the query for selecting the records,
  19340. subclasses can override this for custom behaviour.]]>
  19341. </doc>
  19342. </method>
  19343. <doc>
  19344. <![CDATA[A RecordReader that reads records from a SQL table,
  19345. using data-driven WHERE clause splits.
  19346. Emits LongWritables containing the record number as
  19347. key and DBWritables as value.]]>
  19348. </doc>
  19349. </class>
  19350. <!-- end class org.apache.hadoop.mapreduce.lib.db.DataDrivenDBRecordReader -->
  19351. <!-- start class org.apache.hadoop.mapreduce.lib.db.DateSplitter -->
  19352. <class name="DateSplitter" extends="org.apache.hadoop.mapreduce.lib.db.IntegerSplitter"
  19353. abstract="false"
  19354. static="false" final="false" visibility="public"
  19355. deprecated="not deprecated">
  19356. <constructor name="DateSplitter"
  19357. static="false" final="false" visibility="public"
  19358. deprecated="not deprecated">
  19359. </constructor>
  19360. <method name="split" return="java.util.List"
  19361. abstract="false" native="false" synchronized="false"
  19362. static="false" final="false" visibility="public"
  19363. deprecated="not deprecated">
  19364. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19365. <param name="results" type="java.sql.ResultSet"/>
  19366. <param name="colName" type="java.lang.String"/>
  19367. <exception name="SQLException" type="java.sql.SQLException"/>
  19368. </method>
  19369. <method name="dateToString" return="java.lang.String"
  19370. abstract="false" native="false" synchronized="false"
  19371. static="false" final="false" visibility="protected"
  19372. deprecated="not deprecated">
  19373. <param name="d" type="java.util.Date"/>
  19374. <doc>
  19375. <![CDATA[Given a Date 'd', format it as a string for use in a SQL date
  19376. comparison operation.
  19377. @param d the date to format.
  19378. @return the string representing this date in SQL with any appropriate
  19379. quotation characters, etc.]]>
  19380. </doc>
  19381. </method>
  19382. <doc>
  19383. <![CDATA[Implement DBSplitter over date/time values.
  19384. Make use of logic from IntegerSplitter, since date/time are just longs
  19385. in Java.]]>
  19386. </doc>
  19387. </class>
  19388. <!-- end class org.apache.hadoop.mapreduce.lib.db.DateSplitter -->
  19389. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBConfiguration -->
  19390. <class name="DBConfiguration" extends="java.lang.Object"
  19391. abstract="false"
  19392. static="false" final="false" visibility="public"
  19393. deprecated="not deprecated">
  19394. <constructor name="DBConfiguration" type="org.apache.hadoop.conf.Configuration"
  19395. static="false" final="false" visibility="public"
  19396. deprecated="not deprecated">
  19397. </constructor>
  19398. <method name="configureDB"
  19399. abstract="false" native="false" synchronized="false"
  19400. static="true" final="false" visibility="public"
  19401. deprecated="not deprecated">
  19402. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19403. <param name="driverClass" type="java.lang.String"/>
  19404. <param name="dbUrl" type="java.lang.String"/>
  19405. <param name="userName" type="java.lang.String"/>
  19406. <param name="passwd" type="java.lang.String"/>
  19407. <doc>
  19408. <![CDATA[Sets the DB access related fields in the {@link Configuration}.
  19409. @param conf the configuration
  19410. @param driverClass JDBC Driver class name
  19411. @param dbUrl JDBC DB access URL.
  19412. @param userName DB access username
  19413. @param passwd DB access password]]>
  19414. </doc>
  19415. </method>
  19416. <method name="configureDB"
  19417. abstract="false" native="false" synchronized="false"
  19418. static="true" final="false" visibility="public"
  19419. deprecated="not deprecated">
  19420. <param name="job" type="org.apache.hadoop.conf.Configuration"/>
  19421. <param name="driverClass" type="java.lang.String"/>
  19422. <param name="dbUrl" type="java.lang.String"/>
  19423. <doc>
  19424. <![CDATA[Sets the DB access related fields in the JobConf.
  19425. @param job the job
  19426. @param driverClass JDBC Driver class name
  19427. @param dbUrl JDBC DB access URL.]]>
  19428. </doc>
  19429. </method>
  19430. <method name="getConnection" return="java.sql.Connection"
  19431. abstract="false" native="false" synchronized="false"
  19432. static="false" final="false" visibility="public"
  19433. deprecated="not deprecated">
  19434. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  19435. <exception name="SQLException" type="java.sql.SQLException"/>
  19436. <doc>
  19437. <![CDATA[Returns a connection object to the DB
  19438. @throws ClassNotFoundException
  19439. @throws SQLException]]>
  19440. </doc>
  19441. </method>
  19442. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  19443. abstract="false" native="false" synchronized="false"
  19444. static="false" final="false" visibility="public"
  19445. deprecated="not deprecated">
  19446. </method>
  19447. <method name="getInputTableName" return="java.lang.String"
  19448. abstract="false" native="false" synchronized="false"
  19449. static="false" final="false" visibility="public"
  19450. deprecated="not deprecated">
  19451. </method>
  19452. <method name="setInputTableName"
  19453. abstract="false" native="false" synchronized="false"
  19454. static="false" final="false" visibility="public"
  19455. deprecated="not deprecated">
  19456. <param name="tableName" type="java.lang.String"/>
  19457. </method>
  19458. <method name="getInputFieldNames" return="java.lang.String[]"
  19459. abstract="false" native="false" synchronized="false"
  19460. static="false" final="false" visibility="public"
  19461. deprecated="not deprecated">
  19462. </method>
  19463. <method name="setInputFieldNames"
  19464. abstract="false" native="false" synchronized="false"
  19465. static="false" final="false" visibility="public"
  19466. deprecated="not deprecated">
  19467. <param name="fieldNames" type="java.lang.String[]"/>
  19468. </method>
  19469. <method name="getInputConditions" return="java.lang.String"
  19470. abstract="false" native="false" synchronized="false"
  19471. static="false" final="false" visibility="public"
  19472. deprecated="not deprecated">
  19473. </method>
  19474. <method name="setInputConditions"
  19475. abstract="false" native="false" synchronized="false"
  19476. static="false" final="false" visibility="public"
  19477. deprecated="not deprecated">
  19478. <param name="conditions" type="java.lang.String"/>
  19479. </method>
  19480. <method name="getInputOrderBy" return="java.lang.String"
  19481. abstract="false" native="false" synchronized="false"
  19482. static="false" final="false" visibility="public"
  19483. deprecated="not deprecated">
  19484. </method>
  19485. <method name="setInputOrderBy"
  19486. abstract="false" native="false" synchronized="false"
  19487. static="false" final="false" visibility="public"
  19488. deprecated="not deprecated">
  19489. <param name="orderby" type="java.lang.String"/>
  19490. </method>
  19491. <method name="getInputQuery" return="java.lang.String"
  19492. abstract="false" native="false" synchronized="false"
  19493. static="false" final="false" visibility="public"
  19494. deprecated="not deprecated">
  19495. </method>
  19496. <method name="setInputQuery"
  19497. abstract="false" native="false" synchronized="false"
  19498. static="false" final="false" visibility="public"
  19499. deprecated="not deprecated">
  19500. <param name="query" type="java.lang.String"/>
  19501. </method>
  19502. <method name="getInputCountQuery" return="java.lang.String"
  19503. abstract="false" native="false" synchronized="false"
  19504. static="false" final="false" visibility="public"
  19505. deprecated="not deprecated">
  19506. </method>
  19507. <method name="setInputCountQuery"
  19508. abstract="false" native="false" synchronized="false"
  19509. static="false" final="false" visibility="public"
  19510. deprecated="not deprecated">
  19511. <param name="query" type="java.lang.String"/>
  19512. </method>
  19513. <method name="setInputBoundingQuery"
  19514. abstract="false" native="false" synchronized="false"
  19515. static="false" final="false" visibility="public"
  19516. deprecated="not deprecated">
  19517. <param name="query" type="java.lang.String"/>
  19518. </method>
  19519. <method name="getInputBoundingQuery" return="java.lang.String"
  19520. abstract="false" native="false" synchronized="false"
  19521. static="false" final="false" visibility="public"
  19522. deprecated="not deprecated">
  19523. </method>
  19524. <method name="getInputClass" return="java.lang.Class"
  19525. abstract="false" native="false" synchronized="false"
  19526. static="false" final="false" visibility="public"
  19527. deprecated="not deprecated">
  19528. </method>
  19529. <method name="setInputClass"
  19530. abstract="false" native="false" synchronized="false"
  19531. static="false" final="false" visibility="public"
  19532. deprecated="not deprecated">
  19533. <param name="inputClass" type="java.lang.Class"/>
  19534. </method>
  19535. <method name="getOutputTableName" return="java.lang.String"
  19536. abstract="false" native="false" synchronized="false"
  19537. static="false" final="false" visibility="public"
  19538. deprecated="not deprecated">
  19539. </method>
  19540. <method name="setOutputTableName"
  19541. abstract="false" native="false" synchronized="false"
  19542. static="false" final="false" visibility="public"
  19543. deprecated="not deprecated">
  19544. <param name="tableName" type="java.lang.String"/>
  19545. </method>
  19546. <method name="getOutputFieldNames" return="java.lang.String[]"
  19547. abstract="false" native="false" synchronized="false"
  19548. static="false" final="false" visibility="public"
  19549. deprecated="not deprecated">
  19550. </method>
  19551. <method name="setOutputFieldNames"
  19552. abstract="false" native="false" synchronized="false"
  19553. static="false" final="false" visibility="public"
  19554. deprecated="not deprecated">
  19555. <param name="fieldNames" type="java.lang.String[]"/>
  19556. </method>
  19557. <method name="setOutputFieldCount"
  19558. abstract="false" native="false" synchronized="false"
  19559. static="false" final="false" visibility="public"
  19560. deprecated="not deprecated">
  19561. <param name="fieldCount" type="int"/>
  19562. </method>
  19563. <method name="getOutputFieldCount" return="int"
  19564. abstract="false" native="false" synchronized="false"
  19565. static="false" final="false" visibility="public"
  19566. deprecated="not deprecated">
  19567. </method>
  19568. <field name="DRIVER_CLASS_PROPERTY" type="java.lang.String"
  19569. transient="false" volatile="false"
  19570. static="true" final="true" visibility="public"
  19571. deprecated="not deprecated">
  19572. <doc>
  19573. <![CDATA[The JDBC Driver class name]]>
  19574. </doc>
  19575. </field>
  19576. <field name="URL_PROPERTY" type="java.lang.String"
  19577. transient="false" volatile="false"
  19578. static="true" final="true" visibility="public"
  19579. deprecated="not deprecated">
  19580. <doc>
  19581. <![CDATA[JDBC Database access URL]]>
  19582. </doc>
  19583. </field>
  19584. <field name="USERNAME_PROPERTY" type="java.lang.String"
  19585. transient="false" volatile="false"
  19586. static="true" final="true" visibility="public"
  19587. deprecated="not deprecated">
  19588. <doc>
  19589. <![CDATA[User name to access the database]]>
  19590. </doc>
  19591. </field>
  19592. <field name="PASSWORD_PROPERTY" type="java.lang.String"
  19593. transient="false" volatile="false"
  19594. static="true" final="true" visibility="public"
  19595. deprecated="not deprecated">
  19596. <doc>
  19597. <![CDATA[Password to access the database]]>
  19598. </doc>
  19599. </field>
  19600. <field name="INPUT_TABLE_NAME_PROPERTY" type="java.lang.String"
  19601. transient="false" volatile="false"
  19602. static="true" final="true" visibility="public"
  19603. deprecated="not deprecated">
  19604. <doc>
  19605. <![CDATA[Input table name]]>
  19606. </doc>
  19607. </field>
  19608. <field name="INPUT_FIELD_NAMES_PROPERTY" type="java.lang.String"
  19609. transient="false" volatile="false"
  19610. static="true" final="true" visibility="public"
  19611. deprecated="not deprecated">
  19612. <doc>
  19613. <![CDATA[Field names in the Input table]]>
  19614. </doc>
  19615. </field>
  19616. <field name="INPUT_CONDITIONS_PROPERTY" type="java.lang.String"
  19617. transient="false" volatile="false"
  19618. static="true" final="true" visibility="public"
  19619. deprecated="not deprecated">
  19620. <doc>
  19621. <![CDATA[WHERE clause in the input SELECT statement]]>
  19622. </doc>
  19623. </field>
  19624. <field name="INPUT_ORDER_BY_PROPERTY" type="java.lang.String"
  19625. transient="false" volatile="false"
  19626. static="true" final="true" visibility="public"
  19627. deprecated="not deprecated">
  19628. <doc>
  19629. <![CDATA[ORDER BY clause in the input SELECT statement]]>
  19630. </doc>
  19631. </field>
  19632. <field name="INPUT_QUERY" type="java.lang.String"
  19633. transient="false" volatile="false"
  19634. static="true" final="true" visibility="public"
  19635. deprecated="not deprecated">
  19636. <doc>
  19637. <![CDATA[Whole input query, excluding LIMIT...OFFSET]]>
  19638. </doc>
  19639. </field>
  19640. <field name="INPUT_COUNT_QUERY" type="java.lang.String"
  19641. transient="false" volatile="false"
  19642. static="true" final="true" visibility="public"
  19643. deprecated="not deprecated">
  19644. <doc>
  19645. <![CDATA[Input query to get the count of records]]>
  19646. </doc>
  19647. </field>
  19648. <field name="INPUT_BOUNDING_QUERY" type="java.lang.String"
  19649. transient="false" volatile="false"
  19650. static="true" final="true" visibility="public"
  19651. deprecated="not deprecated">
  19652. <doc>
  19653. <![CDATA[Input query to get the max and min values of the jdbc.input.query]]>
  19654. </doc>
  19655. </field>
  19656. <field name="INPUT_CLASS_PROPERTY" type="java.lang.String"
  19657. transient="false" volatile="false"
  19658. static="true" final="true" visibility="public"
  19659. deprecated="not deprecated">
  19660. <doc>
  19661. <![CDATA[Class name implementing DBWritable which will hold input tuples]]>
  19662. </doc>
  19663. </field>
  19664. <field name="OUTPUT_TABLE_NAME_PROPERTY" type="java.lang.String"
  19665. transient="false" volatile="false"
  19666. static="true" final="true" visibility="public"
  19667. deprecated="not deprecated">
  19668. <doc>
  19669. <![CDATA[Output table name]]>
  19670. </doc>
  19671. </field>
  19672. <field name="OUTPUT_FIELD_NAMES_PROPERTY" type="java.lang.String"
  19673. transient="false" volatile="false"
  19674. static="true" final="true" visibility="public"
  19675. deprecated="not deprecated">
  19676. <doc>
  19677. <![CDATA[Field names in the Output table]]>
  19678. </doc>
  19679. </field>
  19680. <field name="OUTPUT_FIELD_COUNT_PROPERTY" type="java.lang.String"
  19681. transient="false" volatile="false"
  19682. static="true" final="true" visibility="public"
  19683. deprecated="not deprecated">
  19684. <doc>
  19685. <![CDATA[Number of fields in the Output table]]>
  19686. </doc>
  19687. </field>
  19688. <doc>
  19689. <![CDATA[A container for configuration property names for jobs with DB input/output.
  19690. The job can be configured using the static methods in this class,
  19691. {@link DBInputFormat}, and {@link DBOutputFormat}.
  19692. Alternatively, the properties can be set in the configuration with proper
  19693. values.
  19694. @see DBConfiguration#configureDB(Configuration, String, String, String, String)
  19695. @see DBInputFormat#setInput(Job, Class, String, String)
  19696. @see DBInputFormat#setInput(Job, Class, String, String, String, String...)
  19697. @see DBOutputFormat#setOutput(Job, String, String...)]]>
  19698. </doc>
  19699. </class>
  19700. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBConfiguration -->
  19701. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBInputFormat -->
  19702. <class name="DBInputFormat" extends="org.apache.hadoop.mapreduce.InputFormat"
  19703. abstract="false"
  19704. static="false" final="false" visibility="public"
  19705. deprecated="not deprecated">
  19706. <implements name="org.apache.hadoop.conf.Configurable"/>
  19707. <constructor name="DBInputFormat"
  19708. static="false" final="false" visibility="public"
  19709. deprecated="not deprecated">
  19710. </constructor>
  19711. <method name="setConf"
  19712. abstract="false" native="false" synchronized="false"
  19713. static="false" final="false" visibility="public"
  19714. deprecated="not deprecated">
  19715. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19716. <doc>
  19717. <![CDATA[{@inheritDoc}]]>
  19718. </doc>
  19719. </method>
  19720. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  19721. abstract="false" native="false" synchronized="false"
  19722. static="false" final="false" visibility="public"
  19723. deprecated="not deprecated">
  19724. </method>
  19725. <method name="getDBConf" return="org.apache.hadoop.mapreduce.lib.db.DBConfiguration"
  19726. abstract="false" native="false" synchronized="false"
  19727. static="false" final="false" visibility="public"
  19728. deprecated="not deprecated">
  19729. </method>
  19730. <method name="getConnection" return="java.sql.Connection"
  19731. abstract="false" native="false" synchronized="false"
  19732. static="false" final="false" visibility="public"
  19733. deprecated="not deprecated">
  19734. </method>
  19735. <method name="getDBProductName" return="java.lang.String"
  19736. abstract="false" native="false" synchronized="false"
  19737. static="false" final="false" visibility="public"
  19738. deprecated="not deprecated">
  19739. </method>
  19740. <method name="createDBRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  19741. abstract="false" native="false" synchronized="false"
  19742. static="false" final="false" visibility="protected"
  19743. deprecated="not deprecated">
  19744. <param name="split" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit"/>
  19745. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  19746. <exception name="IOException" type="java.io.IOException"/>
  19747. </method>
  19748. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  19749. abstract="false" native="false" synchronized="false"
  19750. static="false" final="false" visibility="public"
  19751. deprecated="not deprecated">
  19752. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  19753. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  19754. <exception name="IOException" type="java.io.IOException"/>
  19755. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  19756. <doc>
  19757. <![CDATA[{@inheritDoc}]]>
  19758. </doc>
  19759. </method>
  19760. <method name="getSplits" return="java.util.List"
  19761. abstract="false" native="false" synchronized="false"
  19762. static="false" final="false" visibility="public"
  19763. deprecated="not deprecated">
  19764. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  19765. <exception name="IOException" type="java.io.IOException"/>
  19766. <doc>
  19767. <![CDATA[{@inheritDoc}]]>
  19768. </doc>
  19769. </method>
  19770. <method name="getCountQuery" return="java.lang.String"
  19771. abstract="false" native="false" synchronized="false"
  19772. static="false" final="false" visibility="protected"
  19773. deprecated="not deprecated">
  19774. <doc>
  19775. <![CDATA[Returns the query for getting the total number of rows,
  19776. subclasses can override this for custom behaviour.]]>
  19777. </doc>
  19778. </method>
  19779. <method name="setInput"
  19780. abstract="false" native="false" synchronized="false"
  19781. static="true" final="false" visibility="public"
  19782. deprecated="not deprecated">
  19783. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  19784. <param name="inputClass" type="java.lang.Class"/>
  19785. <param name="tableName" type="java.lang.String"/>
  19786. <param name="conditions" type="java.lang.String"/>
  19787. <param name="orderBy" type="java.lang.String"/>
  19788. <param name="fieldNames" type="java.lang.String[]"/>
  19789. <doc>
  19790. <![CDATA[Initializes the map-part of the job with the appropriate input settings.
  19791. @param job The map-reduce job
  19792. @param inputClass the class object implementing DBWritable, which is the
  19793. Java object holding tuple fields.
  19794. @param tableName The table to read data from
  19795. @param conditions The condition with which to select data,
  19796. e.g. '(updated > 20070101 AND length > 0)'
  19797. @param orderBy the fieldNames in the orderBy clause.
  19798. @param fieldNames The field names in the table
  19799. @see #setInput(Job, Class, String, String)]]>
  19800. </doc>
  19801. </method>
  19802. <method name="setInput"
  19803. abstract="false" native="false" synchronized="false"
  19804. static="true" final="false" visibility="public"
  19805. deprecated="not deprecated">
  19806. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  19807. <param name="inputClass" type="java.lang.Class"/>
  19808. <param name="inputQuery" type="java.lang.String"/>
  19809. <param name="inputCountQuery" type="java.lang.String"/>
  19810. <doc>
  19811. <![CDATA[Initializes the map-part of the job with the appropriate input settings.
  19812. @param job The map-reduce job
  19813. @param inputClass the class object implementing DBWritable, which is the
  19814. Java object holding tuple fields.
  19815. @param inputQuery the input query to select fields. Example :
  19816. "SELECT f1, f2, f3 FROM Mytable ORDER BY f1"
  19817. @param inputCountQuery the input query that returns
  19818. the number of records in the table.
  19819. Example : "SELECT COUNT(f1) FROM Mytable"
  19820. @see #setInput(Job, Class, String, String, String, String...)]]>
  19821. </doc>
  19822. </method>
  19823. <method name="closeConnection"
  19824. abstract="false" native="false" synchronized="false"
  19825. static="false" final="false" visibility="protected"
  19826. deprecated="not deprecated">
  19827. </method>
  19828. <doc>
  19829. <![CDATA[An InputFormat that reads input data from an SQL table.
  19830. <p>
  19831. DBInputFormat emits LongWritables containing the record number as
  19832. key and DBWritables as value.
  19833. The SQL query and input class can be set using one of the two
  19834. setInput methods.]]>
  19835. </doc>
  19836. </class>
  19837. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBInputFormat -->
  19838. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit -->
  19839. <class name="DBInputFormat.DBInputSplit" extends="org.apache.hadoop.mapreduce.InputSplit"
  19840. abstract="false"
  19841. static="true" final="false" visibility="public"
  19842. deprecated="not deprecated">
  19843. <implements name="org.apache.hadoop.io.Writable"/>
  19844. <constructor name="DBInputFormat.DBInputSplit"
  19845. static="false" final="false" visibility="public"
  19846. deprecated="not deprecated">
  19847. <doc>
  19848. <![CDATA[Default Constructor]]>
  19849. </doc>
  19850. </constructor>
  19851. <constructor name="DBInputFormat.DBInputSplit" type="long, long"
  19852. static="false" final="false" visibility="public"
  19853. deprecated="not deprecated">
  19854. <doc>
  19855. <![CDATA[Convenience Constructor
  19856. @param start the index of the first row to select
  19857. @param end the index of the last row to select]]>
  19858. </doc>
  19859. </constructor>
  19860. <method name="getLocations" return="java.lang.String[]"
  19861. abstract="false" native="false" synchronized="false"
  19862. static="false" final="false" visibility="public"
  19863. deprecated="not deprecated">
  19864. <exception name="IOException" type="java.io.IOException"/>
  19865. <doc>
  19866. <![CDATA[{@inheritDoc}]]>
  19867. </doc>
  19868. </method>
  19869. <method name="getStart" return="long"
  19870. abstract="false" native="false" synchronized="false"
  19871. static="false" final="false" visibility="public"
  19872. deprecated="not deprecated">
  19873. <doc>
  19874. <![CDATA[@return The index of the first row to select]]>
  19875. </doc>
  19876. </method>
  19877. <method name="getEnd" return="long"
  19878. abstract="false" native="false" synchronized="false"
  19879. static="false" final="false" visibility="public"
  19880. deprecated="not deprecated">
  19881. <doc>
  19882. <![CDATA[@return The index of the last row to select]]>
  19883. </doc>
  19884. </method>
  19885. <method name="getLength" return="long"
  19886. abstract="false" native="false" synchronized="false"
  19887. static="false" final="false" visibility="public"
  19888. deprecated="not deprecated">
  19889. <exception name="IOException" type="java.io.IOException"/>
  19890. <doc>
  19891. <![CDATA[@return The total row count in this split]]>
  19892. </doc>
  19893. </method>
  19894. <method name="readFields"
  19895. abstract="false" native="false" synchronized="false"
  19896. static="false" final="false" visibility="public"
  19897. deprecated="not deprecated">
  19898. <param name="input" type="java.io.DataInput"/>
  19899. <exception name="IOException" type="java.io.IOException"/>
  19900. <doc>
  19901. <![CDATA[{@inheritDoc}]]>
  19902. </doc>
  19903. </method>
  19904. <method name="write"
  19905. abstract="false" native="false" synchronized="false"
  19906. static="false" final="false" visibility="public"
  19907. deprecated="not deprecated">
  19908. <param name="output" type="java.io.DataOutput"/>
  19909. <exception name="IOException" type="java.io.IOException"/>
  19910. <doc>
  19911. <![CDATA[{@inheritDoc}]]>
  19912. </doc>
  19913. </method>
  19914. <doc>
  19915. <![CDATA[An InputSplit that spans a set of rows]]>
  19916. </doc>
  19917. </class>
  19918. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit -->
  19919. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBInputFormat.NullDBWritable -->
  19920. <class name="DBInputFormat.NullDBWritable" extends="java.lang.Object"
  19921. abstract="false"
  19922. static="true" final="false" visibility="public"
  19923. deprecated="not deprecated">
  19924. <implements name="org.apache.hadoop.mapreduce.lib.db.DBWritable"/>
  19925. <implements name="org.apache.hadoop.io.Writable"/>
  19926. <constructor name="DBInputFormat.NullDBWritable"
  19927. static="false" final="false" visibility="public"
  19928. deprecated="not deprecated">
  19929. </constructor>
  19930. <method name="readFields"
  19931. abstract="false" native="false" synchronized="false"
  19932. static="false" final="false" visibility="public"
  19933. deprecated="not deprecated">
  19934. <param name="in" type="java.io.DataInput"/>
  19935. <exception name="IOException" type="java.io.IOException"/>
  19936. </method>
  19937. <method name="readFields"
  19938. abstract="false" native="false" synchronized="false"
  19939. static="false" final="false" visibility="public"
  19940. deprecated="not deprecated">
  19941. <param name="arg0" type="java.sql.ResultSet"/>
  19942. <exception name="SQLException" type="java.sql.SQLException"/>
  19943. </method>
  19944. <method name="write"
  19945. abstract="false" native="false" synchronized="false"
  19946. static="false" final="false" visibility="public"
  19947. deprecated="not deprecated">
  19948. <param name="out" type="java.io.DataOutput"/>
  19949. <exception name="IOException" type="java.io.IOException"/>
  19950. </method>
  19951. <method name="write"
  19952. abstract="false" native="false" synchronized="false"
  19953. static="false" final="false" visibility="public"
  19954. deprecated="not deprecated">
  19955. <param name="arg0" type="java.sql.PreparedStatement"/>
  19956. <exception name="SQLException" type="java.sql.SQLException"/>
  19957. </method>
  19958. <doc>
  19959. <![CDATA[A Class that does nothing, implementing DBWritable]]>
  19960. </doc>
  19961. </class>
  19962. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBInputFormat.NullDBWritable -->
  19963. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBOutputFormat -->
  19964. <class name="DBOutputFormat" extends="org.apache.hadoop.mapreduce.OutputFormat"
  19965. abstract="false"
  19966. static="false" final="false" visibility="public"
  19967. deprecated="not deprecated">
  19968. <constructor name="DBOutputFormat"
  19969. static="false" final="false" visibility="public"
  19970. deprecated="not deprecated">
  19971. </constructor>
  19972. <method name="checkOutputSpecs"
  19973. abstract="false" native="false" synchronized="false"
  19974. static="false" final="false" visibility="public"
  19975. deprecated="not deprecated">
  19976. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  19977. <exception name="IOException" type="java.io.IOException"/>
  19978. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  19979. </method>
  19980. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  19981. abstract="false" native="false" synchronized="false"
  19982. static="false" final="false" visibility="public"
  19983. deprecated="not deprecated">
  19984. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  19985. <exception name="IOException" type="java.io.IOException"/>
  19986. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  19987. </method>
  19988. <method name="constructQuery" return="java.lang.String"
  19989. abstract="false" native="false" synchronized="false"
  19990. static="false" final="false" visibility="public"
  19991. deprecated="not deprecated">
  19992. <param name="table" type="java.lang.String"/>
  19993. <param name="fieldNames" type="java.lang.String[]"/>
  19994. <doc>
  19995. <![CDATA[Constructs the query used as the prepared statement to insert data.
  19996. @param table
  19997. the table to insert into
  19998. @param fieldNames
  19999. the fields to insert into. If field names are unknown, supply an
  20000. array of nulls.]]>
  20001. </doc>
  20002. </method>
  20003. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  20004. abstract="false" native="false" synchronized="false"
  20005. static="false" final="false" visibility="public"
  20006. deprecated="not deprecated">
  20007. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  20008. <exception name="IOException" type="java.io.IOException"/>
  20009. <doc>
  20010. <![CDATA[{@inheritDoc}]]>
  20011. </doc>
  20012. </method>
  20013. <method name="setOutput"
  20014. abstract="false" native="false" synchronized="false"
  20015. static="true" final="false" visibility="public"
  20016. deprecated="not deprecated">
  20017. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  20018. <param name="tableName" type="java.lang.String"/>
  20019. <param name="fieldNames" type="java.lang.String[]"/>
  20020. <exception name="IOException" type="java.io.IOException"/>
  20021. <doc>
  20022. <![CDATA[Initializes the reduce-part of the job with
  20023. the appropriate output settings
  20024. @param job The job
  20025. @param tableName The table to insert data into
  20026. @param fieldNames The field names in the table.]]>
  20027. </doc>
  20028. </method>
  20029. <method name="setOutput"
  20030. abstract="false" native="false" synchronized="false"
  20031. static="true" final="false" visibility="public"
  20032. deprecated="not deprecated">
  20033. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  20034. <param name="tableName" type="java.lang.String"/>
  20035. <param name="fieldCount" type="int"/>
  20036. <exception name="IOException" type="java.io.IOException"/>
  20037. <doc>
  20038. <![CDATA[Initializes the reduce-part of the job
  20039. with the appropriate output settings
  20040. @param job The job
  20041. @param tableName The table to insert data into
  20042. @param fieldCount the number of fields in the table.]]>
  20043. </doc>
  20044. </method>
  20045. <doc>
  20046. <![CDATA[An OutputFormat that sends the reduce output to a SQL table.
  20047. <p>
  20048. {@link DBOutputFormat} accepts &lt;key,value&gt; pairs, where
  20049. key has a type extending DBWritable. Returned {@link RecordWriter}
  20050. writes <b>only the key</b> to the database with a batch SQL query.]]>
  20051. </doc>
  20052. </class>
  20053. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBOutputFormat -->
  20054. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBOutputFormat.DBRecordWriter -->
  20055. <class name="DBOutputFormat.DBRecordWriter" extends="org.apache.hadoop.mapreduce.RecordWriter"
  20056. abstract="false"
  20057. static="false" final="false" visibility="public"
  20058. deprecated="not deprecated">
  20059. <constructor name="DBOutputFormat.DBRecordWriter"
  20060. static="false" final="false" visibility="public"
  20061. deprecated="not deprecated">
  20062. <exception name="SQLException" type="java.sql.SQLException"/>
  20063. </constructor>
  20064. <constructor name="DBOutputFormat.DBRecordWriter" type="java.sql.Connection, java.sql.PreparedStatement"
  20065. static="false" final="false" visibility="public"
  20066. deprecated="not deprecated">
  20067. <exception name="SQLException" type="java.sql.SQLException"/>
  20068. </constructor>
  20069. <method name="getConnection" return="java.sql.Connection"
  20070. abstract="false" native="false" synchronized="false"
  20071. static="false" final="false" visibility="public"
  20072. deprecated="not deprecated">
  20073. </method>
  20074. <method name="getStatement" return="java.sql.PreparedStatement"
  20075. abstract="false" native="false" synchronized="false"
  20076. static="false" final="false" visibility="public"
  20077. deprecated="not deprecated">
  20078. </method>
  20079. <method name="close"
  20080. abstract="false" native="false" synchronized="false"
  20081. static="false" final="false" visibility="public"
  20082. deprecated="not deprecated">
  20083. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  20084. <exception name="IOException" type="java.io.IOException"/>
  20085. <doc>
  20086. <![CDATA[{@inheritDoc}]]>
  20087. </doc>
  20088. </method>
  20089. <method name="write"
  20090. abstract="false" native="false" synchronized="false"
  20091. static="false" final="false" visibility="public"
  20092. deprecated="not deprecated">
  20093. <param name="key" type="K"/>
  20094. <param name="value" type="V"/>
  20095. <exception name="IOException" type="java.io.IOException"/>
  20096. <doc>
  20097. <![CDATA[{@inheritDoc}]]>
  20098. </doc>
  20099. </method>
  20100. <doc>
  20101. <![CDATA[A RecordWriter that writes the reduce output to a SQL table]]>
  20102. </doc>
  20103. </class>
  20104. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBOutputFormat.DBRecordWriter -->
  20105. <!-- start class org.apache.hadoop.mapreduce.lib.db.DBRecordReader -->
  20106. <class name="DBRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  20107. abstract="false"
  20108. static="false" final="false" visibility="public"
  20109. deprecated="not deprecated">
  20110. <constructor name="DBRecordReader" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.conf.Configuration, java.sql.Connection, org.apache.hadoop.mapreduce.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String"
  20111. static="false" final="false" visibility="public"
  20112. deprecated="not deprecated">
  20113. <exception name="SQLException" type="java.sql.SQLException"/>
  20114. <doc>
  20115. <![CDATA[@param split The InputSplit to read data for
  20116. @throws SQLException]]>
  20117. </doc>
  20118. </constructor>
  20119. <method name="executeQuery" return="java.sql.ResultSet"
  20120. abstract="false" native="false" synchronized="false"
  20121. static="false" final="false" visibility="protected"
  20122. deprecated="not deprecated">
  20123. <param name="query" type="java.lang.String"/>
  20124. <exception name="SQLException" type="java.sql.SQLException"/>
  20125. </method>
  20126. <method name="getSelectQuery" return="java.lang.String"
  20127. abstract="false" native="false" synchronized="false"
  20128. static="false" final="false" visibility="protected"
  20129. deprecated="not deprecated">
  20130. <doc>
  20131. <![CDATA[Returns the query for selecting the records,
  20132. subclasses can override this for custom behaviour.]]>
  20133. </doc>
  20134. </method>
  20135. <method name="close"
  20136. abstract="false" native="false" synchronized="false"
  20137. static="false" final="false" visibility="public"
  20138. deprecated="not deprecated">
  20139. <exception name="IOException" type="java.io.IOException"/>
  20140. <doc>
  20141. <![CDATA[{@inheritDoc}]]>
  20142. </doc>
  20143. </method>
  20144. <method name="initialize"
  20145. abstract="false" native="false" synchronized="false"
  20146. static="false" final="false" visibility="public"
  20147. deprecated="not deprecated">
  20148. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  20149. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  20150. <exception name="IOException" type="java.io.IOException"/>
  20151. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20152. </method>
  20153. <method name="getCurrentKey" return="org.apache.hadoop.io.LongWritable"
  20154. abstract="false" native="false" synchronized="false"
  20155. static="false" final="false" visibility="public"
  20156. deprecated="not deprecated">
  20157. <doc>
  20158. <![CDATA[{@inheritDoc}]]>
  20159. </doc>
  20160. </method>
  20161. <method name="getCurrentValue" return="T"
  20162. abstract="false" native="false" synchronized="false"
  20163. static="false" final="false" visibility="public"
  20164. deprecated="not deprecated">
  20165. <doc>
  20166. <![CDATA[{@inheritDoc}]]>
  20167. </doc>
  20168. </method>
  20169. <method name="createValue" return="T"
  20170. abstract="false" native="false" synchronized="false"
  20171. static="false" final="false" visibility="public"
  20172. deprecated="deprecated, no comment">
  20173. <doc>
  20174. <![CDATA[@deprecated]]>
  20175. </doc>
  20176. </method>
  20177. <method name="getPos" return="long"
  20178. abstract="false" native="false" synchronized="false"
  20179. static="false" final="false" visibility="public"
  20180. deprecated="deprecated, no comment">
  20181. <exception name="IOException" type="java.io.IOException"/>
  20182. <doc>
  20183. <![CDATA[@deprecated]]>
  20184. </doc>
  20185. </method>
  20186. <method name="next" return="boolean"
  20187. abstract="false" native="false" synchronized="false"
  20188. static="false" final="false" visibility="public"
  20189. deprecated="Use {@link #nextKeyValue()}">
  20190. <param name="key" type="org.apache.hadoop.io.LongWritable"/>
  20191. <param name="value" type="T"/>
  20192. <exception name="IOException" type="java.io.IOException"/>
  20193. <doc>
  20194. <![CDATA[@deprecated Use {@link #nextKeyValue()}]]>
  20195. </doc>
  20196. </method>
  20197. <method name="getProgress" return="float"
  20198. abstract="false" native="false" synchronized="false"
  20199. static="false" final="false" visibility="public"
  20200. deprecated="not deprecated">
  20201. <exception name="IOException" type="java.io.IOException"/>
  20202. <doc>
  20203. <![CDATA[{@inheritDoc}]]>
  20204. </doc>
  20205. </method>
  20206. <method name="nextKeyValue" return="boolean"
  20207. abstract="false" native="false" synchronized="false"
  20208. static="false" final="false" visibility="public"
  20209. deprecated="not deprecated">
  20210. <exception name="IOException" type="java.io.IOException"/>
  20211. <doc>
  20212. <![CDATA[{@inheritDoc}]]>
  20213. </doc>
  20214. </method>
  20215. <method name="getSplit" return="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit"
  20216. abstract="false" native="false" synchronized="false"
  20217. static="false" final="false" visibility="protected"
  20218. deprecated="not deprecated">
  20219. </method>
  20220. <method name="getFieldNames" return="java.lang.String[]"
  20221. abstract="false" native="false" synchronized="false"
  20222. static="false" final="false" visibility="protected"
  20223. deprecated="not deprecated">
  20224. </method>
  20225. <method name="getTableName" return="java.lang.String"
  20226. abstract="false" native="false" synchronized="false"
  20227. static="false" final="false" visibility="protected"
  20228. deprecated="not deprecated">
  20229. </method>
  20230. <method name="getConditions" return="java.lang.String"
  20231. abstract="false" native="false" synchronized="false"
  20232. static="false" final="false" visibility="protected"
  20233. deprecated="not deprecated">
  20234. </method>
  20235. <method name="getDBConf" return="org.apache.hadoop.mapreduce.lib.db.DBConfiguration"
  20236. abstract="false" native="false" synchronized="false"
  20237. static="false" final="false" visibility="protected"
  20238. deprecated="not deprecated">
  20239. </method>
  20240. <method name="getConnection" return="java.sql.Connection"
  20241. abstract="false" native="false" synchronized="false"
  20242. static="false" final="false" visibility="protected"
  20243. deprecated="not deprecated">
  20244. </method>
  20245. <method name="getStatement" return="java.sql.PreparedStatement"
  20246. abstract="false" native="false" synchronized="false"
  20247. static="false" final="false" visibility="protected"
  20248. deprecated="not deprecated">
  20249. </method>
  20250. <method name="setStatement"
  20251. abstract="false" native="false" synchronized="false"
  20252. static="false" final="false" visibility="protected"
  20253. deprecated="not deprecated">
  20254. <param name="stmt" type="java.sql.PreparedStatement"/>
  20255. </method>
  20256. <field name="statement" type="java.sql.PreparedStatement"
  20257. transient="false" volatile="false"
  20258. static="false" final="false" visibility="protected"
  20259. deprecated="not deprecated">
  20260. </field>
  20261. <doc>
  20262. <![CDATA[A RecordReader that reads records from a SQL table.
  20263. Emits LongWritables containing the record number as
  20264. key and DBWritables as value.]]>
  20265. </doc>
  20266. </class>
  20267. <!-- end class org.apache.hadoop.mapreduce.lib.db.DBRecordReader -->
  20268. <!-- start interface org.apache.hadoop.mapreduce.lib.db.DBSplitter -->
  20269. <interface name="DBSplitter" abstract="true"
  20270. static="false" final="false" visibility="public"
  20271. deprecated="not deprecated">
  20272. <method name="split" return="java.util.List"
  20273. abstract="false" native="false" synchronized="false"
  20274. static="false" final="false" visibility="public"
  20275. deprecated="not deprecated">
  20276. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  20277. <param name="results" type="java.sql.ResultSet"/>
  20278. <param name="colName" type="java.lang.String"/>
  20279. <exception name="SQLException" type="java.sql.SQLException"/>
  20280. <doc>
  20281. <![CDATA[Given a ResultSet containing one record (and already advanced to that record)
  20282. with two columns (a low value, and a high value, both of the same type), determine
  20283. a set of splits that span the given values.]]>
  20284. </doc>
  20285. </method>
  20286. <doc>
  20287. <![CDATA[DBSplitter will generate DBInputSplits to use with DataDrivenDBInputFormat.
  20288. DataDrivenDBInputFormat needs to interpolate between two values that
  20289. represent the lowest and highest valued records to import. Depending
  20290. on the data-type of the column, this requires different behavior.
  20291. DBSplitter implementations should perform this for a data type or family
  20292. of data types.]]>
  20293. </doc>
  20294. </interface>
  20295. <!-- end interface org.apache.hadoop.mapreduce.lib.db.DBSplitter -->
  20296. <!-- start interface org.apache.hadoop.mapreduce.lib.db.DBWritable -->
  20297. <interface name="DBWritable" abstract="true"
  20298. static="false" final="false" visibility="public"
  20299. deprecated="not deprecated">
  20300. <method name="write"
  20301. abstract="false" native="false" synchronized="false"
  20302. static="false" final="false" visibility="public"
  20303. deprecated="not deprecated">
  20304. <param name="statement" type="java.sql.PreparedStatement"/>
  20305. <exception name="SQLException" type="java.sql.SQLException"/>
  20306. <doc>
  20307. <![CDATA[Sets the fields of the object in the {@link PreparedStatement}.
  20308. @param statement the statement that the fields are put into.
  20309. @throws SQLException]]>
  20310. </doc>
  20311. </method>
  20312. <method name="readFields"
  20313. abstract="false" native="false" synchronized="false"
  20314. static="false" final="false" visibility="public"
  20315. deprecated="not deprecated">
  20316. <param name="resultSet" type="java.sql.ResultSet"/>
  20317. <exception name="SQLException" type="java.sql.SQLException"/>
  20318. <doc>
  20319. <![CDATA[Reads the fields of the object from the {@link ResultSet}.
  20320. @param resultSet the {@link ResultSet} to get the fields from.
  20321. @throws SQLException]]>
  20322. </doc>
  20323. </method>
  20324. <doc>
  20325. <![CDATA[Objects that are read from/written to a database should implement
  20326. <code>DBWritable</code>. DBWritable is similar to {@link Writable}
  20327. except that the {@link #write(PreparedStatement)} method takes a
  20328. {@link PreparedStatement}, and {@link #readFields(ResultSet)}
  20329. takes a {@link ResultSet}.
  20330. <p>
  20331. Implementations are responsible for writing the fields of the object
  20332. to PreparedStatement, and reading the fields of the object from the
  20333. ResultSet.
  20334. <p>Example:</p>
  20335. If we have the following table in the database :
  20336. <pre>
  20337. CREATE TABLE MyTable (
  20338. counter INTEGER NOT NULL,
  20339. timestamp BIGINT NOT NULL
  20340. );
  20341. </pre>
  20342. then we can read/write the tuples from/to the table with :
  20343. <p><pre>
  20344. public class MyWritable implements Writable, DBWritable {
  20345. // Some data
  20346. private int counter;
  20347. private long timestamp;
  20348. //Writable#write() implementation
  20349. public void write(DataOutput out) throws IOException {
  20350. out.writeInt(counter);
  20351. out.writeLong(timestamp);
  20352. }
  20353. //Writable#readFields() implementation
  20354. public void readFields(DataInput in) throws IOException {
  20355. counter = in.readInt();
  20356. timestamp = in.readLong();
  20357. }
  20358. public void write(PreparedStatement statement) throws SQLException {
  20359. statement.setInt(1, counter);
  20360. statement.setLong(2, timestamp);
  20361. }
  20362. public void readFields(ResultSet resultSet) throws SQLException {
  20363. counter = resultSet.getInt(1);
  20364. timestamp = resultSet.getLong(2);
  20365. }
  20366. }
  20367. </pre></p>]]>
  20368. </doc>
  20369. </interface>
  20370. <!-- end interface org.apache.hadoop.mapreduce.lib.db.DBWritable -->
  20371. <!-- start class org.apache.hadoop.mapreduce.lib.db.FloatSplitter -->
  20372. <class name="FloatSplitter" extends="java.lang.Object"
  20373. abstract="false"
  20374. static="false" final="false" visibility="public"
  20375. deprecated="not deprecated">
  20376. <implements name="org.apache.hadoop.mapreduce.lib.db.DBSplitter"/>
  20377. <constructor name="FloatSplitter"
  20378. static="false" final="false" visibility="public"
  20379. deprecated="not deprecated">
  20380. </constructor>
  20381. <method name="split" return="java.util.List"
  20382. abstract="false" native="false" synchronized="false"
  20383. static="false" final="false" visibility="public"
  20384. deprecated="not deprecated">
  20385. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  20386. <param name="results" type="java.sql.ResultSet"/>
  20387. <param name="colName" type="java.lang.String"/>
  20388. <exception name="SQLException" type="java.sql.SQLException"/>
  20389. </method>
  20390. <doc>
  20391. <![CDATA[Implement DBSplitter over floating-point values.]]>
  20392. </doc>
  20393. </class>
  20394. <!-- end class org.apache.hadoop.mapreduce.lib.db.FloatSplitter -->
  20395. <!-- start class org.apache.hadoop.mapreduce.lib.db.IntegerSplitter -->
  20396. <class name="IntegerSplitter" extends="java.lang.Object"
  20397. abstract="false"
  20398. static="false" final="false" visibility="public"
  20399. deprecated="not deprecated">
  20400. <implements name="org.apache.hadoop.mapreduce.lib.db.DBSplitter"/>
  20401. <constructor name="IntegerSplitter"
  20402. static="false" final="false" visibility="public"
  20403. deprecated="not deprecated">
  20404. </constructor>
  20405. <method name="split" return="java.util.List"
  20406. abstract="false" native="false" synchronized="false"
  20407. static="false" final="false" visibility="public"
  20408. deprecated="not deprecated">
  20409. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  20410. <param name="results" type="java.sql.ResultSet"/>
  20411. <param name="colName" type="java.lang.String"/>
  20412. <exception name="SQLException" type="java.sql.SQLException"/>
  20413. </method>
  20414. <doc>
  20415. <![CDATA[Implement DBSplitter over integer values.]]>
  20416. </doc>
  20417. </class>
  20418. <!-- end class org.apache.hadoop.mapreduce.lib.db.IntegerSplitter -->
  20419. <!-- start class org.apache.hadoop.mapreduce.lib.db.MySQLDataDrivenDBRecordReader -->
  20420. <class name="MySQLDataDrivenDBRecordReader" extends="org.apache.hadoop.mapreduce.lib.db.DataDrivenDBRecordReader"
  20421. abstract="false"
  20422. static="false" final="false" visibility="public"
  20423. deprecated="not deprecated">
  20424. <constructor name="MySQLDataDrivenDBRecordReader" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.conf.Configuration, java.sql.Connection, org.apache.hadoop.mapreduce.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String"
  20425. static="false" final="false" visibility="public"
  20426. deprecated="not deprecated">
  20427. <exception name="SQLException" type="java.sql.SQLException"/>
  20428. </constructor>
  20429. <method name="executeQuery" return="java.sql.ResultSet"
  20430. abstract="false" native="false" synchronized="false"
  20431. static="false" final="false" visibility="protected"
  20432. deprecated="not deprecated">
  20433. <param name="query" type="java.lang.String"/>
  20434. <exception name="SQLException" type="java.sql.SQLException"/>
  20435. </method>
  20436. <doc>
  20437. <![CDATA[A RecordReader that reads records from a MySQL table via DataDrivenDBRecordReader]]>
  20438. </doc>
  20439. </class>
  20440. <!-- end class org.apache.hadoop.mapreduce.lib.db.MySQLDataDrivenDBRecordReader -->
  20441. <!-- start class org.apache.hadoop.mapreduce.lib.db.MySQLDBRecordReader -->
  20442. <class name="MySQLDBRecordReader" extends="org.apache.hadoop.mapreduce.lib.db.DBRecordReader"
  20443. abstract="false"
  20444. static="false" final="false" visibility="public"
  20445. deprecated="not deprecated">
  20446. <constructor name="MySQLDBRecordReader" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.conf.Configuration, java.sql.Connection, org.apache.hadoop.mapreduce.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String"
  20447. static="false" final="false" visibility="public"
  20448. deprecated="not deprecated">
  20449. <exception name="SQLException" type="java.sql.SQLException"/>
  20450. </constructor>
  20451. <method name="executeQuery" return="java.sql.ResultSet"
  20452. abstract="false" native="false" synchronized="false"
  20453. static="false" final="false" visibility="protected"
  20454. deprecated="not deprecated">
  20455. <param name="query" type="java.lang.String"/>
  20456. <exception name="SQLException" type="java.sql.SQLException"/>
  20457. </method>
  20458. <doc>
  20459. <![CDATA[A RecordReader that reads records from a MySQL table.]]>
  20460. </doc>
  20461. </class>
  20462. <!-- end class org.apache.hadoop.mapreduce.lib.db.MySQLDBRecordReader -->
  20463. <!-- start class org.apache.hadoop.mapreduce.lib.db.OracleDataDrivenDBInputFormat -->
  20464. <class name="OracleDataDrivenDBInputFormat" extends="org.apache.hadoop.mapreduce.lib.db.DataDrivenDBInputFormat"
  20465. abstract="false"
  20466. static="false" final="false" visibility="public"
  20467. deprecated="not deprecated">
  20468. <implements name="org.apache.hadoop.conf.Configurable"/>
  20469. <constructor name="OracleDataDrivenDBInputFormat"
  20470. static="false" final="false" visibility="public"
  20471. deprecated="not deprecated">
  20472. </constructor>
  20473. <method name="getSplitter" return="org.apache.hadoop.mapreduce.lib.db.DBSplitter"
  20474. abstract="false" native="false" synchronized="false"
  20475. static="false" final="false" visibility="protected"
  20476. deprecated="not deprecated">
  20477. <param name="sqlDataType" type="int"/>
  20478. <doc>
  20479. <![CDATA[@return the DBSplitter implementation to use to divide the table/query into InputSplits.]]>
  20480. </doc>
  20481. </method>
  20482. <method name="createDBRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  20483. abstract="false" native="false" synchronized="false"
  20484. static="false" final="false" visibility="protected"
  20485. deprecated="not deprecated">
  20486. <param name="split" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit"/>
  20487. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  20488. <exception name="IOException" type="java.io.IOException"/>
  20489. </method>
  20490. <doc>
  20491. <![CDATA[An InputFormat that reads input data from an SQL table in an Oracle db.]]>
  20492. </doc>
  20493. </class>
  20494. <!-- end class org.apache.hadoop.mapreduce.lib.db.OracleDataDrivenDBInputFormat -->
  20495. <!-- start class org.apache.hadoop.mapreduce.lib.db.OracleDataDrivenDBRecordReader -->
  20496. <class name="OracleDataDrivenDBRecordReader" extends="org.apache.hadoop.mapreduce.lib.db.DataDrivenDBRecordReader"
  20497. abstract="false"
  20498. static="false" final="false" visibility="public"
  20499. deprecated="not deprecated">
  20500. <constructor name="OracleDataDrivenDBRecordReader" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.conf.Configuration, java.sql.Connection, org.apache.hadoop.mapreduce.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String"
  20501. static="false" final="false" visibility="public"
  20502. deprecated="not deprecated">
  20503. <exception name="SQLException" type="java.sql.SQLException"/>
  20504. </constructor>
  20505. <doc>
  20506. <![CDATA[A RecordReader that reads records from an Oracle table via DataDrivenDBRecordReader]]>
  20507. </doc>
  20508. </class>
  20509. <!-- end class org.apache.hadoop.mapreduce.lib.db.OracleDataDrivenDBRecordReader -->
  20510. <!-- start class org.apache.hadoop.mapreduce.lib.db.OracleDateSplitter -->
  20511. <class name="OracleDateSplitter" extends="org.apache.hadoop.mapreduce.lib.db.DateSplitter"
  20512. abstract="false"
  20513. static="false" final="false" visibility="public"
  20514. deprecated="not deprecated">
  20515. <constructor name="OracleDateSplitter"
  20516. static="false" final="false" visibility="public"
  20517. deprecated="not deprecated">
  20518. </constructor>
  20519. <method name="dateToString" return="java.lang.String"
  20520. abstract="false" native="false" synchronized="false"
  20521. static="false" final="false" visibility="protected"
  20522. deprecated="not deprecated">
  20523. <param name="d" type="java.util.Date"/>
  20524. </method>
  20525. <doc>
  20526. <![CDATA[Implement DBSplitter over date/time values returned by an Oracle db.
  20527. Make use of logic from DateSplitter, since this just needs to use
  20528. some Oracle-specific functions on the formatting end when generating
  20529. InputSplits.]]>
  20530. </doc>
  20531. </class>
  20532. <!-- end class org.apache.hadoop.mapreduce.lib.db.OracleDateSplitter -->
  20533. <!-- start class org.apache.hadoop.mapreduce.lib.db.OracleDBRecordReader -->
  20534. <class name="OracleDBRecordReader" extends="org.apache.hadoop.mapreduce.lib.db.DBRecordReader"
  20535. abstract="false"
  20536. static="false" final="false" visibility="public"
  20537. deprecated="not deprecated">
  20538. <constructor name="OracleDBRecordReader" type="org.apache.hadoop.mapreduce.lib.db.DBInputFormat.DBInputSplit, java.lang.Class, org.apache.hadoop.conf.Configuration, java.sql.Connection, org.apache.hadoop.mapreduce.lib.db.DBConfiguration, java.lang.String, java.lang.String[], java.lang.String"
  20539. static="false" final="false" visibility="public"
  20540. deprecated="not deprecated">
  20541. <exception name="SQLException" type="java.sql.SQLException"/>
  20542. </constructor>
  20543. <method name="getSelectQuery" return="java.lang.String"
  20544. abstract="false" native="false" synchronized="false"
  20545. static="false" final="false" visibility="protected"
  20546. deprecated="not deprecated">
  20547. <doc>
  20548. <![CDATA[Returns the query for selecting the records from an Oracle DB.]]>
  20549. </doc>
  20550. </method>
  20551. <method name="setSessionTimeZone"
  20552. abstract="false" native="false" synchronized="false"
  20553. static="true" final="false" visibility="public"
  20554. deprecated="not deprecated">
  20555. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  20556. <param name="conn" type="java.sql.Connection"/>
  20557. <exception name="SQLException" type="java.sql.SQLException"/>
  20558. <doc>
  20559. <![CDATA[Set session time zone
  20560. @param conf The current configuration.
  20561. We read the 'oracle.sessionTimeZone' property from here.
  20562. @param conn The connection to alter the timezone properties of.]]>
  20563. </doc>
  20564. </method>
  20565. <field name="SESSION_TIMEZONE_KEY" type="java.lang.String"
  20566. transient="false" volatile="false"
  20567. static="true" final="true" visibility="public"
  20568. deprecated="not deprecated">
  20569. <doc>
  20570. <![CDATA[Configuration key to set to a timezone string.]]>
  20571. </doc>
  20572. </field>
  20573. <doc>
  20574. <![CDATA[A RecordReader that reads records from an Oracle SQL table.]]>
  20575. </doc>
  20576. </class>
  20577. <!-- end class org.apache.hadoop.mapreduce.lib.db.OracleDBRecordReader -->
  20578. <!-- start class org.apache.hadoop.mapreduce.lib.db.TextSplitter -->
  20579. <class name="TextSplitter" extends="org.apache.hadoop.mapreduce.lib.db.BigDecimalSplitter"
  20580. abstract="false"
  20581. static="false" final="false" visibility="public"
  20582. deprecated="not deprecated">
  20583. <constructor name="TextSplitter"
  20584. static="false" final="false" visibility="public"
  20585. deprecated="not deprecated">
  20586. </constructor>
  20587. <method name="split" return="java.util.List"
  20588. abstract="false" native="false" synchronized="false"
  20589. static="false" final="false" visibility="public"
  20590. deprecated="not deprecated">
  20591. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  20592. <param name="results" type="java.sql.ResultSet"/>
  20593. <param name="colName" type="java.lang.String"/>
  20594. <exception name="SQLException" type="java.sql.SQLException"/>
  20595. <doc>
  20596. <![CDATA[This method needs to determine the splits between two user-provided strings.
  20597. In the case where the user's strings are 'A' and 'Z', this is not hard; we
  20598. could create two splits from ['A', 'M') and ['M', 'Z'], 26 splits for strings
  20599. beginning with each letter, etc.
  20600. If a user has provided us with the strings "Ham" and "Haze", however, we need
  20601. to create splits that differ in the third letter.
  20602. The algorithm used is as follows:
  20603. Since there are 2**16 unicode characters, we interpret characters as digits in
  20604. base 65536. Given a string 's' containing characters s_0, s_1 .. s_n, we interpret
  20605. the string as the number: 0.s_0 s_1 s_2.. s_n in base 65536. Having mapped the
  20606. low and high strings into floating-point values, we then use the BigDecimalSplitter
  20607. to establish the even split points, then map the resulting floating point values
  20608. back into strings.]]>
  20609. </doc>
  20610. </method>
  20611. <doc>
  20612. <![CDATA[Implement DBSplitter over text strings.]]>
  20613. </doc>
  20614. </class>
  20615. <!-- end class org.apache.hadoop.mapreduce.lib.db.TextSplitter -->
  20616. </package>
  20617. <package name="org.apache.hadoop.mapreduce.lib.fieldsel">
  20618. <!-- start class org.apache.hadoop.mapreduce.lib.fieldsel.FieldSelectionHelper -->
  20619. <class name="FieldSelectionHelper" extends="java.lang.Object"
  20620. abstract="false"
  20621. static="false" final="false" visibility="public"
  20622. deprecated="not deprecated">
  20623. <constructor name="FieldSelectionHelper"
  20624. static="false" final="false" visibility="public"
  20625. deprecated="not deprecated">
  20626. </constructor>
  20627. <constructor name="FieldSelectionHelper" type="org.apache.hadoop.io.Text, org.apache.hadoop.io.Text"
  20628. static="false" final="false" visibility="public"
  20629. deprecated="not deprecated">
  20630. </constructor>
  20631. <method name="parseOutputKeyValueSpec" return="int"
  20632. abstract="false" native="false" synchronized="false"
  20633. static="true" final="false" visibility="public"
  20634. deprecated="not deprecated">
  20635. <param name="keyValueSpec" type="java.lang.String"/>
  20636. <param name="keyFieldList" type="java.util.List"/>
  20637. <param name="valueFieldList" type="java.util.List"/>
  20638. </method>
  20639. <method name="specToString" return="java.lang.String"
  20640. abstract="false" native="false" synchronized="false"
  20641. static="true" final="false" visibility="public"
  20642. deprecated="not deprecated">
  20643. <param name="fieldSeparator" type="java.lang.String"/>
  20644. <param name="keyValueSpec" type="java.lang.String"/>
  20645. <param name="allValueFieldsFrom" type="int"/>
  20646. <param name="keyFieldList" type="java.util.List"/>
  20647. <param name="valueFieldList" type="java.util.List"/>
  20648. </method>
  20649. <method name="getKey" return="org.apache.hadoop.io.Text"
  20650. abstract="false" native="false" synchronized="false"
  20651. static="false" final="false" visibility="public"
  20652. deprecated="not deprecated">
  20653. </method>
  20654. <method name="getValue" return="org.apache.hadoop.io.Text"
  20655. abstract="false" native="false" synchronized="false"
  20656. static="false" final="false" visibility="public"
  20657. deprecated="not deprecated">
  20658. </method>
  20659. <method name="extractOutputKeyValue"
  20660. abstract="false" native="false" synchronized="false"
  20661. static="false" final="false" visibility="public"
  20662. deprecated="not deprecated">
  20663. <param name="key" type="java.lang.String"/>
  20664. <param name="val" type="java.lang.String"/>
  20665. <param name="fieldSep" type="java.lang.String"/>
  20666. <param name="keyFieldList" type="java.util.List"/>
  20667. <param name="valFieldList" type="java.util.List"/>
  20668. <param name="allValueFieldsFrom" type="int"/>
  20669. <param name="ignoreKey" type="boolean"/>
  20670. <param name="isMap" type="boolean"/>
  20671. </method>
  20672. <field name="emptyText" type="org.apache.hadoop.io.Text"
  20673. transient="false" volatile="false"
  20674. static="true" final="false" visibility="public"
  20675. deprecated="not deprecated">
  20676. </field>
  20677. <field name="DATA_FIELD_SEPERATOR" type="java.lang.String"
  20678. transient="false" volatile="false"
  20679. static="true" final="true" visibility="public"
  20680. deprecated="not deprecated">
  20681. </field>
  20682. <field name="MAP_OUTPUT_KEY_VALUE_SPEC" type="java.lang.String"
  20683. transient="false" volatile="false"
  20684. static="true" final="true" visibility="public"
  20685. deprecated="not deprecated">
  20686. </field>
  20687. <field name="REDUCE_OUTPUT_KEY_VALUE_SPEC" type="java.lang.String"
  20688. transient="false" volatile="false"
  20689. static="true" final="true" visibility="public"
  20690. deprecated="not deprecated">
  20691. </field>
  20692. <doc>
  20693. <![CDATA[This class implements a mapper/reducer class that can be used to perform
  20694. field selections in a manner similar to unix cut. The input data is treated
  20695. as fields separated by a user specified separator (the default value is
  20696. "\t"). The user can specify a list of fields that form the map output keys,
  20697. and a list of fields that form the map output values. If the inputformat is
  20698. TextInputFormat, the mapper will ignore the key to the map function, and the
  20699. fields are from the value only. Otherwise, the fields are the union of those
  20700. from the key and those from the value.
  20701. The field separator is under attribute "mapreduce.fieldsel.data.field.separator"
  20702. The map output field list spec is under attribute
  20703. "mapreduce.fieldsel.map.output.key.value.fields.spec".
  20704. The value is expected to be like "keyFieldsSpec:valueFieldsSpec"
  20705. key/valueFieldsSpec are comma (,) separated field spec: fieldSpec,fieldSpec,fieldSpec ...
  20706. Each field spec can be a simple number (e.g. 5) specifying a specific field, or a range
  20707. (like 2-5) to specify a range of fields, or an open range (like 3-) specifying all
  20708. the fields starting from field 3. The open range field spec applies to value fields only.
  20709. They have no effect on the key fields.
  20710. Here is an example: "4,3,0,1:6,5,1-3,7-". It specifies to use fields 4,3,0 and 1 for keys,
  20711. and use fields 6,5,1,2,3,7 and above for values.
  20712. The reduce output field list spec is under attribute
  20713. "mapreduce.fieldsel.reduce.output.key.value.fields.spec".
  20714. The reducer extracts output key/value pairs in a similar manner, except that
  20715. the key is never ignored.]]>
  20716. </doc>
  20717. </class>
  20718. <!-- end class org.apache.hadoop.mapreduce.lib.fieldsel.FieldSelectionHelper -->
  20719. <!-- start class org.apache.hadoop.mapreduce.lib.fieldsel.FieldSelectionMapper -->
  20720. <class name="FieldSelectionMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  20721. abstract="false"
  20722. static="false" final="false" visibility="public"
  20723. deprecated="not deprecated">
  20724. <constructor name="FieldSelectionMapper"
  20725. static="false" final="false" visibility="public"
  20726. deprecated="not deprecated">
  20727. </constructor>
  20728. <method name="setup"
  20729. abstract="false" native="false" synchronized="false"
  20730. static="false" final="false" visibility="public"
  20731. deprecated="not deprecated">
  20732. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  20733. <exception name="IOException" type="java.io.IOException"/>
  20734. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20735. </method>
  20736. <method name="map"
  20737. abstract="false" native="false" synchronized="false"
  20738. static="false" final="false" visibility="public"
  20739. deprecated="not deprecated">
  20740. <param name="key" type="K"/>
  20741. <param name="val" type="V"/>
  20742. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  20743. <exception name="IOException" type="java.io.IOException"/>
  20744. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20745. <doc>
  20746. <![CDATA[The identity function. Input key/value pair is written directly to output.]]>
  20747. </doc>
  20748. </method>
  20749. <field name="LOG" type="org.apache.commons.logging.Log"
  20750. transient="false" volatile="false"
  20751. static="true" final="true" visibility="public"
  20752. deprecated="not deprecated">
  20753. </field>
  20754. <doc>
  20755. <![CDATA[This class implements a mapper class that can be used to perform
  20756. field selections in a manner similar to unix cut. The input data is treated
  20757. as fields separated by a user specified separator (the default value is
  20758. "\t"). The user can specify a list of fields that form the map output keys,
  20759. and a list of fields that form the map output values. If the inputformat is
  20760. TextInputFormat, the mapper will ignore the key to the map function, and the
  20761. fields are from the value only. Otherwise, the fields are the union of those
  20762. from the key and those from the value.
  20763. The field separator is under attribute "mapreduce.fieldsel.data.field.separator"
  20764. The map output field list spec is under attribute
  20765. "mapreduce.fieldsel.map.output.key.value.fields.spec".
  20766. The value is expected to be like
  20767. "keyFieldsSpec:valueFieldsSpec" key/valueFieldsSpec are comma (,) separated
  20768. field spec: fieldSpec,fieldSpec,fieldSpec ... Each field spec can be a
  20769. simple number (e.g. 5) specifying a specific field, or a range (like 2-5)
  20770. to specify a range of fields, or an open range (like 3-) specifying all
  20771. the fields starting from field 3. The open range field spec applies to value
  20772. fields only. It has no effect on the key fields.
  20773. Here is an example: "4,3,0,1:6,5,1-3,7-". It specifies to use fields
  20774. 4,3,0 and 1 for keys, and use fields 6,5,1,2,3,7 and above for values.]]>
  20775. </doc>
  20776. </class>
  20777. <!-- end class org.apache.hadoop.mapreduce.lib.fieldsel.FieldSelectionMapper -->
  20778. <!-- start class org.apache.hadoop.mapreduce.lib.fieldsel.FieldSelectionReducer -->
  20779. <class name="FieldSelectionReducer" extends="org.apache.hadoop.mapreduce.Reducer"
  20780. abstract="false"
  20781. static="false" final="false" visibility="public"
  20782. deprecated="not deprecated">
  20783. <constructor name="FieldSelectionReducer"
  20784. static="false" final="false" visibility="public"
  20785. deprecated="not deprecated">
  20786. </constructor>
  20787. <method name="setup"
  20788. abstract="false" native="false" synchronized="false"
  20789. static="false" final="false" visibility="public"
  20790. deprecated="not deprecated">
  20791. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  20792. <exception name="IOException" type="java.io.IOException"/>
  20793. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20794. </method>
  20795. <method name="reduce"
  20796. abstract="false" native="false" synchronized="false"
  20797. static="false" final="false" visibility="public"
  20798. deprecated="not deprecated">
  20799. <param name="key" type="org.apache.hadoop.io.Text"/>
  20800. <param name="values" type="java.lang.Iterable"/>
  20801. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  20802. <exception name="IOException" type="java.io.IOException"/>
  20803. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20804. </method>
  20805. <field name="LOG" type="org.apache.commons.logging.Log"
  20806. transient="false" volatile="false"
  20807. static="true" final="true" visibility="public"
  20808. deprecated="not deprecated">
  20809. </field>
  20810. <doc>
  20811. <![CDATA[This class implements a reducer class that can be used to perform field
  20812. selections in a manner similar to unix cut.
  20813. The input data is treated as fields separated by a user specified
  20814. separator (the default value is "\t"). The user can specify a list of
  20815. fields that form the reduce output keys, and a list of fields that form
  20816. the reduce output values. The fields are the union of those from the key
  20817. and those from the value.
  20818. The field separator is under attribute "mapreduce.fieldsel.data.field.separator"
  20819. The reduce output field list spec is under attribute
  20820. "mapreduce.fieldsel.reduce.output.key.value.fields.spec".
  20821. The value is expected to be like
  20822. "keyFieldsSpec:valueFieldsSpec" key/valueFieldsSpec are comma (,)
  20823. separated field spec: fieldSpec,fieldSpec,fieldSpec ... Each field spec
  20824. can be a simple number (e.g. 5) specifying a specific field, or a range
  20825. (like 2-5) to specify a range of fields, or an open range (like 3-)
  20826. specifying all the fields starting from field 3. The open range field
  20827. spec applies to value fields only. It has no effect on the key fields.
  20828. Here is an example: "4,3,0,1:6,5,1-3,7-". It specifies to use fields
  20829. 4,3,0 and 1 for keys, and use fields 6,5,1,2,3,7 and above for values.]]>
  20830. </doc>
  20831. </class>
  20832. <!-- end class org.apache.hadoop.mapreduce.lib.fieldsel.FieldSelectionReducer -->
  20833. </package>
  20834. <package name="org.apache.hadoop.mapreduce.lib.input">
  20835. <!-- start class org.apache.hadoop.mapreduce.lib.input.CombineFileInputFormat -->
  20836. <class name="CombineFileInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.FileInputFormat"
  20837. abstract="true"
  20838. static="false" final="false" visibility="public"
  20839. deprecated="not deprecated">
  20840. <constructor name="CombineFileInputFormat"
  20841. static="false" final="false" visibility="public"
  20842. deprecated="not deprecated">
  20843. <doc>
  20844. <![CDATA[default constructor]]>
  20845. </doc>
  20846. </constructor>
  20847. <method name="setMaxSplitSize"
  20848. abstract="false" native="false" synchronized="false"
  20849. static="false" final="false" visibility="protected"
  20850. deprecated="not deprecated">
  20851. <param name="maxSplitSize" type="long"/>
  20852. <doc>
  20853. <![CDATA[Specify the maximum size (in bytes) of each split. Each split is
  20854. approximately equal to the specified size.]]>
  20855. </doc>
  20856. </method>
  20857. <method name="setMinSplitSizeNode"
  20858. abstract="false" native="false" synchronized="false"
  20859. static="false" final="false" visibility="protected"
  20860. deprecated="not deprecated">
  20861. <param name="minSplitSizeNode" type="long"/>
  20862. <doc>
  20863. <![CDATA[Specify the minimum size (in bytes) of each split per node.
  20864. This applies to data that is left over after combining data on a single
  20865. node into splits that are of maximum size specified by maxSplitSize.
  20866. This leftover data will be combined into its own split if its size
  20867. exceeds minSplitSizeNode.]]>
  20868. </doc>
  20869. </method>
  20870. <method name="setMinSplitSizeRack"
  20871. abstract="false" native="false" synchronized="false"
  20872. static="false" final="false" visibility="protected"
  20873. deprecated="not deprecated">
  20874. <param name="minSplitSizeRack" type="long"/>
  20875. <doc>
  20876. <![CDATA[Specify the minimum size (in bytes) of each split per rack.
  20877. This applies to data that is left over after combining data on a single
  20878. rack into splits that are of maximum size specified by maxSplitSize.
  20879. This leftover data will be combined into its own split if its size
  20880. exceeds minSplitSizeRack.]]>
  20881. </doc>
  20882. </method>
  20883. <method name="createPool"
  20884. abstract="false" native="false" synchronized="false"
  20885. static="false" final="false" visibility="protected"
  20886. deprecated="not deprecated">
  20887. <param name="filters" type="java.util.List"/>
  20888. <doc>
  20889. <![CDATA[Create a new pool and add the filters to it.
  20890. A split cannot have files from different pools.]]>
  20891. </doc>
  20892. </method>
  20893. <method name="createPool"
  20894. abstract="false" native="false" synchronized="false"
  20895. static="false" final="false" visibility="protected"
  20896. deprecated="not deprecated">
  20897. <param name="filters" type="org.apache.hadoop.fs.PathFilter[]"/>
  20898. <doc>
  20899. <![CDATA[Create a new pool and add the filters to it.
  20900. A pathname can satisfy any one of the specified filters.
  20901. A split cannot have files from different pools.]]>
  20902. </doc>
  20903. </method>
  20904. <method name="isSplitable" return="boolean"
  20905. abstract="false" native="false" synchronized="false"
  20906. static="false" final="false" visibility="protected"
  20907. deprecated="not deprecated">
  20908. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  20909. <param name="file" type="org.apache.hadoop.fs.Path"/>
  20910. </method>
  20911. <method name="getSplits" return="java.util.List"
  20912. abstract="false" native="false" synchronized="false"
  20913. static="false" final="false" visibility="public"
  20914. deprecated="not deprecated">
  20915. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  20916. <exception name="IOException" type="java.io.IOException"/>
  20917. </method>
  20918. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  20919. abstract="true" native="false" synchronized="false"
  20920. static="false" final="false" visibility="public"
  20921. deprecated="not deprecated">
  20922. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  20923. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  20924. <exception name="IOException" type="java.io.IOException"/>
  20925. <doc>
  20926. <![CDATA[This is not implemented yet.]]>
  20927. </doc>
  20928. </method>
  20929. <field name="SPLIT_MINSIZE_PERNODE" type="java.lang.String"
  20930. transient="false" volatile="false"
  20931. static="true" final="true" visibility="public"
  20932. deprecated="not deprecated">
  20933. </field>
  20934. <field name="SPLIT_MINSIZE_PERRACK" type="java.lang.String"
  20935. transient="false" volatile="false"
  20936. static="true" final="true" visibility="public"
  20937. deprecated="not deprecated">
  20938. </field>
  20939. <doc>
  20940. <![CDATA[An abstract {@link InputFormat} that returns {@link CombineFileSplit}'s in
  20941. {@link InputFormat#getSplits(JobContext)} method.
  20942. Splits are constructed from the files under the input paths.
  20943. A split cannot have files from different pools.
  20944. Each split returned may contain blocks from different files.
  20945. If a maxSplitSize is specified, then blocks on the same node are
  20946. combined to form a single split. Blocks that are left over are
  20947. then combined with other blocks in the same rack.
  20948. If maxSplitSize is not specified, then blocks from the same rack
  20949. are combined in a single split; no attempt is made to create
  20950. node-local splits.
  20951. If the maxSplitSize is equal to the block size, then this class
  20952. is similar to the default splitting behavior in Hadoop: each
  20953. block is a locally processed split.
  20954. Subclasses implement
  20955. {@link InputFormat#createRecordReader(InputSplit, TaskAttemptContext)}
  20956. to construct <code>RecordReader</code>'s for
  20957. <code>CombineFileSplit</code>'s.
  20958. @see CombineFileSplit]]>
  20959. </doc>
  20960. </class>
  20961. <!-- end class org.apache.hadoop.mapreduce.lib.input.CombineFileInputFormat -->
  20962. <!-- start class org.apache.hadoop.mapreduce.lib.input.CombineFileRecordReader -->
  20963. <class name="CombineFileRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  20964. abstract="false"
  20965. static="false" final="false" visibility="public"
  20966. deprecated="not deprecated">
  20967. <constructor name="CombineFileRecordReader" type="org.apache.hadoop.mapreduce.lib.input.CombineFileSplit, org.apache.hadoop.mapreduce.TaskAttemptContext, java.lang.Class"
  20968. static="false" final="false" visibility="public"
  20969. deprecated="not deprecated">
  20970. <exception name="IOException" type="java.io.IOException"/>
  20971. <doc>
  20972. <![CDATA[A generic RecordReader that can hand out different recordReaders
  20973. for each chunk in the CombineFileSplit.]]>
  20974. </doc>
  20975. </constructor>
  20976. <method name="initialize"
  20977. abstract="false" native="false" synchronized="false"
  20978. static="false" final="false" visibility="public"
  20979. deprecated="not deprecated">
  20980. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  20981. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  20982. <exception name="IOException" type="java.io.IOException"/>
  20983. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20984. </method>
  20985. <method name="nextKeyValue" return="boolean"
  20986. abstract="false" native="false" synchronized="false"
  20987. static="false" final="false" visibility="public"
  20988. deprecated="not deprecated">
  20989. <exception name="IOException" type="java.io.IOException"/>
  20990. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20991. </method>
  20992. <method name="getCurrentKey" return="K"
  20993. abstract="false" native="false" synchronized="false"
  20994. static="false" final="false" visibility="public"
  20995. deprecated="not deprecated">
  20996. <exception name="IOException" type="java.io.IOException"/>
  20997. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  20998. </method>
  20999. <method name="getCurrentValue" return="V"
  21000. abstract="false" native="false" synchronized="false"
  21001. static="false" final="false" visibility="public"
  21002. deprecated="not deprecated">
  21003. <exception name="IOException" type="java.io.IOException"/>
  21004. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21005. </method>
  21006. <method name="close"
  21007. abstract="false" native="false" synchronized="false"
  21008. static="false" final="false" visibility="public"
  21009. deprecated="not deprecated">
  21010. <exception name="IOException" type="java.io.IOException"/>
  21011. </method>
  21012. <method name="getProgress" return="float"
  21013. abstract="false" native="false" synchronized="false"
  21014. static="false" final="false" visibility="public"
  21015. deprecated="not deprecated">
  21016. <exception name="IOException" type="java.io.IOException"/>
  21017. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21018. <doc>
  21019. <![CDATA[return progress based on the amount of data processed so far.]]>
  21020. </doc>
  21021. </method>
  21022. <method name="initNextRecordReader" return="boolean"
  21023. abstract="false" native="false" synchronized="false"
  21024. static="false" final="false" visibility="protected"
  21025. deprecated="not deprecated">
  21026. <exception name="IOException" type="java.io.IOException"/>
  21027. <doc>
  21028. <![CDATA[Get the record reader for the next chunk in this CombineFileSplit.]]>
  21029. </doc>
  21030. </method>
  21031. <field name="split" type="org.apache.hadoop.mapreduce.lib.input.CombineFileSplit"
  21032. transient="false" volatile="false"
  21033. static="false" final="false" visibility="protected"
  21034. deprecated="not deprecated">
  21035. </field>
  21036. <field name="rrClass" type="java.lang.Class"
  21037. transient="false" volatile="false"
  21038. static="false" final="false" visibility="protected"
  21039. deprecated="not deprecated">
  21040. </field>
  21041. <field name="rrConstructor" type="java.lang.reflect.Constructor"
  21042. transient="false" volatile="false"
  21043. static="false" final="false" visibility="protected"
  21044. deprecated="not deprecated">
  21045. </field>
  21046. <field name="fs" type="org.apache.hadoop.fs.FileSystem"
  21047. transient="false" volatile="false"
  21048. static="false" final="false" visibility="protected"
  21049. deprecated="not deprecated">
  21050. </field>
  21051. <field name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"
  21052. transient="false" volatile="false"
  21053. static="false" final="false" visibility="protected"
  21054. deprecated="not deprecated">
  21055. </field>
  21056. <field name="idx" type="int"
  21057. transient="false" volatile="false"
  21058. static="false" final="false" visibility="protected"
  21059. deprecated="not deprecated">
  21060. </field>
  21061. <field name="progress" type="long"
  21062. transient="false" volatile="false"
  21063. static="false" final="false" visibility="protected"
  21064. deprecated="not deprecated">
  21065. </field>
  21066. <field name="curReader" type="org.apache.hadoop.mapreduce.RecordReader"
  21067. transient="false" volatile="false"
  21068. static="false" final="false" visibility="protected"
  21069. deprecated="not deprecated">
  21070. </field>
  21071. <doc>
  21072. <![CDATA[A generic RecordReader that can hand out different recordReaders
  21073. for each chunk in a {@link CombineFileSplit}.
  21074. A CombineFileSplit can combine data chunks from multiple files.
  21075. This class allows using different RecordReaders for processing
  21076. these data chunks from different files.
  21077. @see CombineFileSplit]]>
  21078. </doc>
  21079. </class>
  21080. <!-- end class org.apache.hadoop.mapreduce.lib.input.CombineFileRecordReader -->
  21081. <!-- start class org.apache.hadoop.mapreduce.lib.input.CombineFileSplit -->
  21082. <class name="CombineFileSplit" extends="org.apache.hadoop.mapreduce.InputSplit"
  21083. abstract="false"
  21084. static="false" final="false" visibility="public"
  21085. deprecated="not deprecated">
  21086. <implements name="org.apache.hadoop.io.Writable"/>
  21087. <constructor name="CombineFileSplit"
  21088. static="false" final="false" visibility="public"
  21089. deprecated="not deprecated">
  21090. <doc>
  21091. <![CDATA[default constructor]]>
  21092. </doc>
  21093. </constructor>
  21094. <constructor name="CombineFileSplit" type="org.apache.hadoop.fs.Path[], long[], long[], java.lang.String[]"
  21095. static="false" final="false" visibility="public"
  21096. deprecated="not deprecated">
  21097. </constructor>
  21098. <constructor name="CombineFileSplit" type="org.apache.hadoop.fs.Path[], long[]"
  21099. static="false" final="false" visibility="public"
  21100. deprecated="not deprecated">
  21101. </constructor>
  21102. <constructor name="CombineFileSplit" type="org.apache.hadoop.mapreduce.lib.input.CombineFileSplit"
  21103. static="false" final="false" visibility="public"
  21104. deprecated="not deprecated">
  21105. <exception name="IOException" type="java.io.IOException"/>
  21106. <doc>
  21107. <![CDATA[Copy constructor]]>
  21108. </doc>
  21109. </constructor>
  21110. <method name="getLength" return="long"
  21111. abstract="false" native="false" synchronized="false"
  21112. static="false" final="false" visibility="public"
  21113. deprecated="not deprecated">
  21114. </method>
  21115. <method name="getStartOffsets" return="long[]"
  21116. abstract="false" native="false" synchronized="false"
  21117. static="false" final="false" visibility="public"
  21118. deprecated="not deprecated">
  21119. <doc>
  21120. <![CDATA[Returns an array containing the start offsets of the files in the split]]>
  21121. </doc>
  21122. </method>
  21123. <method name="getLengths" return="long[]"
  21124. abstract="false" native="false" synchronized="false"
  21125. static="false" final="false" visibility="public"
  21126. deprecated="not deprecated">
  21127. <doc>
  21128. <![CDATA[Returns an array containing the lengths of the files in the split]]>
  21129. </doc>
  21130. </method>
  21131. <method name="getOffset" return="long"
  21132. abstract="false" native="false" synchronized="false"
  21133. static="false" final="false" visibility="public"
  21134. deprecated="not deprecated">
  21135. <param name="i" type="int"/>
  21136. <doc>
  21137. <![CDATA[Returns the start offset of the i<sup>th</sup> Path]]>
  21138. </doc>
  21139. </method>
  21140. <method name="getLength" return="long"
  21141. abstract="false" native="false" synchronized="false"
  21142. static="false" final="false" visibility="public"
  21143. deprecated="not deprecated">
  21144. <param name="i" type="int"/>
  21145. <doc>
  21146. <![CDATA[Returns the length of the i<sup>th</sup> Path]]>
  21147. </doc>
  21148. </method>
  21149. <method name="getNumPaths" return="int"
  21150. abstract="false" native="false" synchronized="false"
  21151. static="false" final="false" visibility="public"
  21152. deprecated="not deprecated">
  21153. <doc>
  21154. <![CDATA[Returns the number of Paths in the split]]>
  21155. </doc>
  21156. </method>
  21157. <method name="getPath" return="org.apache.hadoop.fs.Path"
  21158. abstract="false" native="false" synchronized="false"
  21159. static="false" final="false" visibility="public"
  21160. deprecated="not deprecated">
  21161. <param name="i" type="int"/>
  21162. <doc>
  21163. <![CDATA[Returns the i<sup>th</sup> Path]]>
  21164. </doc>
  21165. </method>
  21166. <method name="getPaths" return="org.apache.hadoop.fs.Path[]"
  21167. abstract="false" native="false" synchronized="false"
  21168. static="false" final="false" visibility="public"
  21169. deprecated="not deprecated">
  21170. <doc>
  21171. <![CDATA[Returns all the Paths in the split]]>
  21172. </doc>
  21173. </method>
  21174. <method name="getLocations" return="java.lang.String[]"
  21175. abstract="false" native="false" synchronized="false"
  21176. static="false" final="false" visibility="public"
  21177. deprecated="not deprecated">
  21178. <exception name="IOException" type="java.io.IOException"/>
  21179. <doc>
  21180. <![CDATA[Returns all the locations where this input-split resides]]>
  21181. </doc>
  21182. </method>
  21183. <method name="readFields"
  21184. abstract="false" native="false" synchronized="false"
  21185. static="false" final="false" visibility="public"
  21186. deprecated="not deprecated">
  21187. <param name="in" type="java.io.DataInput"/>
  21188. <exception name="IOException" type="java.io.IOException"/>
  21189. </method>
  21190. <method name="write"
  21191. abstract="false" native="false" synchronized="false"
  21192. static="false" final="false" visibility="public"
  21193. deprecated="not deprecated">
  21194. <param name="out" type="java.io.DataOutput"/>
  21195. <exception name="IOException" type="java.io.IOException"/>
  21196. </method>
  21197. <method name="toString" return="java.lang.String"
  21198. abstract="false" native="false" synchronized="false"
  21199. static="false" final="false" visibility="public"
  21200. deprecated="not deprecated">
  21201. </method>
  21202. <doc>
  21203. <![CDATA[A sub-collection of input files.
  21204. Unlike {@link FileSplit}, CombineFileSplit class does not represent
  21205. a split of a file, but a split of input files into smaller sets.
  21206. A split may contain blocks from different files but all
  21207. the blocks in the same split are probably local to some rack <br>
  21208. CombineFileSplit can be used to implement {@link RecordReader}'s,
  21209. with reading one record per file.
  21210. @see FileSplit
  21211. @see CombineFileInputFormat]]>
  21212. </doc>
  21213. </class>
  21214. <!-- end class org.apache.hadoop.mapreduce.lib.input.CombineFileSplit -->
  21215. <!-- start class org.apache.hadoop.mapreduce.lib.input.FileInputFormat -->
  21216. <class name="FileInputFormat" extends="org.apache.hadoop.mapreduce.InputFormat"
  21217. abstract="true"
  21218. static="false" final="false" visibility="public"
  21219. deprecated="not deprecated">
  21220. <constructor name="FileInputFormat"
  21221. static="false" final="false" visibility="public"
  21222. deprecated="not deprecated">
  21223. </constructor>
  21224. <method name="getFormatMinSplitSize" return="long"
  21225. abstract="false" native="false" synchronized="false"
  21226. static="false" final="false" visibility="protected"
  21227. deprecated="not deprecated">
  21228. <doc>
  21229. <![CDATA[Get the lower bound on split size imposed by the format.
  21230. @return the number of bytes of the minimal split for this format]]>
  21231. </doc>
  21232. </method>
  21233. <method name="isSplitable" return="boolean"
  21234. abstract="false" native="false" synchronized="false"
  21235. static="false" final="false" visibility="protected"
  21236. deprecated="not deprecated">
  21237. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  21238. <param name="filename" type="org.apache.hadoop.fs.Path"/>
  21239. <doc>
  21240. <![CDATA[Is the given filename splitable? Usually, true, but if the file is
  21241. stream compressed, it will not be.
  21242. <code>FileInputFormat</code> implementations can override this and return
  21243. <code>false</code> to ensure that individual input files are never split-up
  21244. so that {@link Mapper}s process entire files.
  21245. @param context the job context
  21246. @param filename the file name to check
  21247. @return is this file splitable?]]>
  21248. </doc>
  21249. </method>
  21250. <method name="setInputPathFilter"
  21251. abstract="false" native="false" synchronized="false"
  21252. static="true" final="false" visibility="public"
  21253. deprecated="not deprecated">
  21254. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21255. <param name="filter" type="java.lang.Class"/>
  21256. <doc>
  21257. <![CDATA[Set a PathFilter to be applied to the input paths for the map-reduce job.
  21258. @param job the job to modify
  21259. @param filter the PathFilter class to use for filtering the input paths.]]>
  21260. </doc>
  21261. </method>
  21262. <method name="setMinInputSplitSize"
  21263. abstract="false" native="false" synchronized="false"
  21264. static="true" final="false" visibility="public"
  21265. deprecated="not deprecated">
  21266. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21267. <param name="size" type="long"/>
  21268. <doc>
  21269. <![CDATA[Set the minimum input split size
  21270. @param job the job to modify
  21271. @param size the minimum size]]>
  21272. </doc>
  21273. </method>
  21274. <method name="getMinSplitSize" return="long"
  21275. abstract="false" native="false" synchronized="false"
  21276. static="true" final="false" visibility="public"
  21277. deprecated="not deprecated">
  21278. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  21279. <doc>
  21280. <![CDATA[Get the minimum split size
  21281. @param job the job
  21282. @return the minimum number of bytes that can be in a split]]>
  21283. </doc>
  21284. </method>
  21285. <method name="setMaxInputSplitSize"
  21286. abstract="false" native="false" synchronized="false"
  21287. static="true" final="false" visibility="public"
  21288. deprecated="not deprecated">
  21289. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21290. <param name="size" type="long"/>
  21291. <doc>
  21292. <![CDATA[Set the maximum split size
  21293. @param job the job to modify
  21294. @param size the maximum split size]]>
  21295. </doc>
  21296. </method>
  21297. <method name="getMaxSplitSize" return="long"
  21298. abstract="false" native="false" synchronized="false"
  21299. static="true" final="false" visibility="public"
  21300. deprecated="not deprecated">
  21301. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  21302. <doc>
  21303. <![CDATA[Get the maximum split size.
  21304. @param context the job to look at.
  21305. @return the maximum number of bytes a split can include]]>
  21306. </doc>
  21307. </method>
  21308. <method name="getInputPathFilter" return="org.apache.hadoop.fs.PathFilter"
  21309. abstract="false" native="false" synchronized="false"
  21310. static="true" final="false" visibility="public"
  21311. deprecated="not deprecated">
  21312. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  21313. <doc>
  21314. <![CDATA[Get a PathFilter instance of the filter set for the input paths.
  21315. @return the PathFilter instance set for the job, NULL if none has been set.]]>
  21316. </doc>
  21317. </method>
  21318. <method name="listStatus" return="java.util.List"
  21319. abstract="false" native="false" synchronized="false"
  21320. static="false" final="false" visibility="protected"
  21321. deprecated="not deprecated">
  21322. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  21323. <exception name="IOException" type="java.io.IOException"/>
  21324. <doc>
  21325. <![CDATA[List input directories.
  21326. Subclasses may override to, e.g., select only files matching a regular
  21327. expression.
  21328. @param job the job to list input paths for
  21329. @return list of FileStatus objects
  21330. @throws IOException if zero items.]]>
  21331. </doc>
  21332. </method>
  21333. <method name="makeSplit" return="org.apache.hadoop.mapreduce.lib.input.FileSplit"
  21334. abstract="false" native="false" synchronized="false"
  21335. static="false" final="false" visibility="protected"
  21336. deprecated="not deprecated">
  21337. <param name="file" type="org.apache.hadoop.fs.Path"/>
  21338. <param name="start" type="long"/>
  21339. <param name="length" type="long"/>
  21340. <param name="hosts" type="java.lang.String[]"/>
  21341. <doc>
  21342. <![CDATA[A factory that makes the split for this class. It can be overridden
  21343. by sub-classes to make sub-types]]>
  21344. </doc>
  21345. </method>
  21346. <method name="getSplits" return="java.util.List"
  21347. abstract="false" native="false" synchronized="false"
  21348. static="false" final="false" visibility="public"
  21349. deprecated="not deprecated">
  21350. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  21351. <exception name="IOException" type="java.io.IOException"/>
  21352. <doc>
  21353. <![CDATA[Generate the list of files and make them into FileSplits.
  21354. @param job the job context
  21355. @throws IOException]]>
  21356. </doc>
  21357. </method>
  21358. <method name="computeSplitSize" return="long"
  21359. abstract="false" native="false" synchronized="false"
  21360. static="false" final="false" visibility="protected"
  21361. deprecated="not deprecated">
  21362. <param name="blockSize" type="long"/>
  21363. <param name="minSize" type="long"/>
  21364. <param name="maxSize" type="long"/>
  21365. </method>
  21366. <method name="getBlockIndex" return="int"
  21367. abstract="false" native="false" synchronized="false"
  21368. static="false" final="false" visibility="protected"
  21369. deprecated="not deprecated">
  21370. <param name="blkLocations" type="org.apache.hadoop.fs.BlockLocation[]"/>
  21371. <param name="offset" type="long"/>
  21372. </method>
  21373. <method name="setInputPaths"
  21374. abstract="false" native="false" synchronized="false"
  21375. static="true" final="false" visibility="public"
  21376. deprecated="not deprecated">
  21377. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21378. <param name="commaSeparatedPaths" type="java.lang.String"/>
  21379. <exception name="IOException" type="java.io.IOException"/>
  21380. <doc>
  21381. <![CDATA[Sets the given comma separated paths as the list of inputs
  21382. for the map-reduce job.
  21383. @param job the job
  21384. @param commaSeparatedPaths Comma separated paths to be set as
  21385. the list of inputs for the map-reduce job.]]>
  21386. </doc>
  21387. </method>
  21388. <method name="addInputPaths"
  21389. abstract="false" native="false" synchronized="false"
  21390. static="true" final="false" visibility="public"
  21391. deprecated="not deprecated">
  21392. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21393. <param name="commaSeparatedPaths" type="java.lang.String"/>
  21394. <exception name="IOException" type="java.io.IOException"/>
  21395. <doc>
  21396. <![CDATA[Add the given comma separated paths to the list of inputs for
  21397. the map-reduce job.
  21398. @param job The job to modify
  21399. @param commaSeparatedPaths Comma separated paths to be added to
  21400. the list of inputs for the map-reduce job.]]>
  21401. </doc>
  21402. </method>
  21403. <method name="setInputPaths"
  21404. abstract="false" native="false" synchronized="false"
  21405. static="true" final="false" visibility="public"
  21406. deprecated="not deprecated">
  21407. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21408. <param name="inputPaths" type="org.apache.hadoop.fs.Path[]"/>
  21409. <exception name="IOException" type="java.io.IOException"/>
  21410. <doc>
  21411. <![CDATA[Set the array of {@link Path}s as the list of inputs
  21412. for the map-reduce job.
  21413. @param job The job to modify
  21414. @param inputPaths the {@link Path}s of the input directories/files
  21415. for the map-reduce job.]]>
  21416. </doc>
  21417. </method>
  21418. <method name="addInputPath"
  21419. abstract="false" native="false" synchronized="false"
  21420. static="true" final="false" visibility="public"
  21421. deprecated="not deprecated">
  21422. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21423. <param name="path" type="org.apache.hadoop.fs.Path"/>
  21424. <exception name="IOException" type="java.io.IOException"/>
  21425. <doc>
  21426. <![CDATA[Add a {@link Path} to the list of inputs for the map-reduce job.
  21427. @param job The {@link Job} to modify
  21428. @param path {@link Path} to be added to the list of inputs for
  21429. the map-reduce job.]]>
  21430. </doc>
  21431. </method>
  21432. <method name="getInputPaths" return="org.apache.hadoop.fs.Path[]"
  21433. abstract="false" native="false" synchronized="false"
  21434. static="true" final="false" visibility="public"
  21435. deprecated="not deprecated">
  21436. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  21437. <doc>
  21438. <![CDATA[Get the list of input {@link Path}s for the map-reduce job.
  21439. @param context The job
  21440. @return the list of input {@link Path}s for the map-reduce job.]]>
  21441. </doc>
  21442. </method>
  21443. <field name="COUNTER_GROUP" type="java.lang.String"
  21444. transient="false" volatile="false"
  21445. static="true" final="true" visibility="public"
  21446. deprecated="not deprecated">
  21447. </field>
  21448. <field name="BYTES_READ" type="java.lang.String"
  21449. transient="false" volatile="false"
  21450. static="true" final="true" visibility="public"
  21451. deprecated="not deprecated">
  21452. </field>
  21453. <field name="INPUT_DIR" type="java.lang.String"
  21454. transient="false" volatile="false"
  21455. static="true" final="true" visibility="public"
  21456. deprecated="not deprecated">
  21457. </field>
  21458. <field name="SPLIT_MAXSIZE" type="java.lang.String"
  21459. transient="false" volatile="false"
  21460. static="true" final="true" visibility="public"
  21461. deprecated="not deprecated">
  21462. </field>
  21463. <field name="SPLIT_MINSIZE" type="java.lang.String"
  21464. transient="false" volatile="false"
  21465. static="true" final="true" visibility="public"
  21466. deprecated="not deprecated">
  21467. </field>
  21468. <field name="PATHFILTER_CLASS" type="java.lang.String"
  21469. transient="false" volatile="false"
  21470. static="true" final="true" visibility="public"
  21471. deprecated="not deprecated">
  21472. </field>
  21473. <field name="NUM_INPUT_FILES" type="java.lang.String"
  21474. transient="false" volatile="false"
  21475. static="true" final="true" visibility="public"
  21476. deprecated="not deprecated">
  21477. </field>
  21478. <doc>
  21479. <![CDATA[A base class for file-based {@link InputFormat}s.
  21480. <p><code>FileInputFormat</code> is the base class for all file-based
  21481. <code>InputFormat</code>s. This provides a generic implementation of
  21482. {@link #getSplits(JobContext)}.
  21483. Subclasses of <code>FileInputFormat</code> can also override the
  21484. {@link #isSplitable(JobContext, Path)} method to ensure input-files are
  21485. not split-up and are processed as a whole by {@link Mapper}s.]]>
  21486. </doc>
  21487. </class>
  21488. <!-- end class org.apache.hadoop.mapreduce.lib.input.FileInputFormat -->
  21489. <!-- start class org.apache.hadoop.mapreduce.lib.input.FileSplit -->
  21490. <class name="FileSplit" extends="org.apache.hadoop.mapreduce.InputSplit"
  21491. abstract="false"
  21492. static="false" final="false" visibility="public"
  21493. deprecated="not deprecated">
  21494. <implements name="org.apache.hadoop.io.Writable"/>
  21495. <constructor name="FileSplit"
  21496. static="false" final="false" visibility="public"
  21497. deprecated="not deprecated">
  21498. </constructor>
  21499. <constructor name="FileSplit" type="org.apache.hadoop.fs.Path, long, long, java.lang.String[]"
  21500. static="false" final="false" visibility="public"
  21501. deprecated="not deprecated">
  21502. <doc>
  21503. <![CDATA[Constructs a split with host information
  21504. @param file the file name
  21505. @param start the position of the first byte in the file to process
  21506. @param length the number of bytes in the file to process
  21507. @param hosts the list of hosts containing the block, possibly null]]>
  21508. </doc>
  21509. </constructor>
  21510. <method name="getPath" return="org.apache.hadoop.fs.Path"
  21511. abstract="false" native="false" synchronized="false"
  21512. static="false" final="false" visibility="public"
  21513. deprecated="not deprecated">
  21514. <doc>
  21515. <![CDATA[The file containing this split's data.]]>
  21516. </doc>
  21517. </method>
  21518. <method name="getStart" return="long"
  21519. abstract="false" native="false" synchronized="false"
  21520. static="false" final="false" visibility="public"
  21521. deprecated="not deprecated">
  21522. <doc>
  21523. <![CDATA[The position of the first byte in the file to process.]]>
  21524. </doc>
  21525. </method>
  21526. <method name="getLength" return="long"
  21527. abstract="false" native="false" synchronized="false"
  21528. static="false" final="false" visibility="public"
  21529. deprecated="not deprecated">
  21530. <doc>
  21531. <![CDATA[The number of bytes in the file to process.]]>
  21532. </doc>
  21533. </method>
  21534. <method name="toString" return="java.lang.String"
  21535. abstract="false" native="false" synchronized="false"
  21536. static="false" final="false" visibility="public"
  21537. deprecated="not deprecated">
  21538. </method>
  21539. <method name="write"
  21540. abstract="false" native="false" synchronized="false"
  21541. static="false" final="false" visibility="public"
  21542. deprecated="not deprecated">
  21543. <param name="out" type="java.io.DataOutput"/>
  21544. <exception name="IOException" type="java.io.IOException"/>
  21545. </method>
  21546. <method name="readFields"
  21547. abstract="false" native="false" synchronized="false"
  21548. static="false" final="false" visibility="public"
  21549. deprecated="not deprecated">
  21550. <param name="in" type="java.io.DataInput"/>
  21551. <exception name="IOException" type="java.io.IOException"/>
  21552. </method>
  21553. <method name="getLocations" return="java.lang.String[]"
  21554. abstract="false" native="false" synchronized="false"
  21555. static="false" final="false" visibility="public"
  21556. deprecated="not deprecated">
  21557. <exception name="IOException" type="java.io.IOException"/>
  21558. </method>
  21559. <doc>
  21560. <![CDATA[A section of an input file. Returned by {@link
  21561. InputFormat#getSplits(JobContext)} and passed to
  21562. {@link InputFormat#createRecordReader(InputSplit,TaskAttemptContext)}.]]>
  21563. </doc>
  21564. </class>
  21565. <!-- end class org.apache.hadoop.mapreduce.lib.input.FileSplit -->
  21566. <!-- start class org.apache.hadoop.mapreduce.lib.input.InvalidInputException -->
  21567. <class name="InvalidInputException" extends="java.io.IOException"
  21568. abstract="false"
  21569. static="false" final="false" visibility="public"
  21570. deprecated="not deprecated">
  21571. <constructor name="InvalidInputException" type="java.util.List"
  21572. static="false" final="false" visibility="public"
  21573. deprecated="not deprecated">
  21574. <doc>
  21575. <![CDATA[Create the exception with the given list.
  21576. @param probs the list of problems to report. This list is not copied.]]>
  21577. </doc>
  21578. </constructor>
  21579. <method name="getProblems" return="java.util.List"
  21580. abstract="false" native="false" synchronized="false"
  21581. static="false" final="false" visibility="public"
  21582. deprecated="not deprecated">
  21583. <doc>
  21584. <![CDATA[Get the complete list of the problems reported.
  21585. @return the list of problems, which must not be modified]]>
  21586. </doc>
  21587. </method>
  21588. <method name="getMessage" return="java.lang.String"
  21589. abstract="false" native="false" synchronized="false"
  21590. static="false" final="false" visibility="public"
  21591. deprecated="not deprecated">
  21592. <doc>
  21593. <![CDATA[Get a summary message of the problems found.
  21594. @return the concatenated messages from all of the problems.]]>
  21595. </doc>
  21596. </method>
  21597. <doc>
  21598. <![CDATA[This class wraps a list of problems with the input, so that the user
  21599. can get a list of problems together instead of finding and fixing them one
  21600. by one.]]>
  21601. </doc>
  21602. </class>
  21603. <!-- end class org.apache.hadoop.mapreduce.lib.input.InvalidInputException -->
  21604. <!-- start class org.apache.hadoop.mapreduce.lib.input.KeyValueLineRecordReader -->
  21605. <class name="KeyValueLineRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  21606. abstract="false"
  21607. static="false" final="false" visibility="public"
  21608. deprecated="not deprecated">
  21609. <constructor name="KeyValueLineRecordReader" type="org.apache.hadoop.conf.Configuration"
  21610. static="false" final="false" visibility="public"
  21611. deprecated="not deprecated">
  21612. <exception name="IOException" type="java.io.IOException"/>
  21613. </constructor>
  21614. <method name="initialize"
  21615. abstract="false" native="false" synchronized="false"
  21616. static="false" final="false" visibility="public"
  21617. deprecated="not deprecated">
  21618. <param name="genericSplit" type="org.apache.hadoop.mapreduce.InputSplit"/>
  21619. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  21620. <exception name="IOException" type="java.io.IOException"/>
  21621. </method>
  21622. <method name="findSeparator" return="int"
  21623. abstract="false" native="false" synchronized="false"
  21624. static="true" final="false" visibility="public"
  21625. deprecated="not deprecated">
  21626. <param name="utf" type="byte[]"/>
  21627. <param name="start" type="int"/>
  21628. <param name="length" type="int"/>
  21629. <param name="sep" type="byte"/>
  21630. </method>
  21631. <method name="setKeyValue"
  21632. abstract="false" native="false" synchronized="false"
  21633. static="true" final="false" visibility="public"
  21634. deprecated="not deprecated">
  21635. <param name="key" type="org.apache.hadoop.io.Text"/>
  21636. <param name="value" type="org.apache.hadoop.io.Text"/>
  21637. <param name="line" type="byte[]"/>
  21638. <param name="lineLen" type="int"/>
  21639. <param name="pos" type="int"/>
  21640. </method>
  21641. <method name="nextKeyValue" return="boolean"
  21642. abstract="false" native="false" synchronized="true"
  21643. static="false" final="false" visibility="public"
  21644. deprecated="not deprecated">
  21645. <exception name="IOException" type="java.io.IOException"/>
  21646. <doc>
  21647. <![CDATA[Read key/value pair in a line.]]>
  21648. </doc>
  21649. </method>
  21650. <method name="getCurrentKey" return="org.apache.hadoop.io.Text"
  21651. abstract="false" native="false" synchronized="false"
  21652. static="false" final="false" visibility="public"
  21653. deprecated="not deprecated">
  21654. </method>
  21655. <method name="getCurrentValue" return="org.apache.hadoop.io.Text"
  21656. abstract="false" native="false" synchronized="false"
  21657. static="false" final="false" visibility="public"
  21658. deprecated="not deprecated">
  21659. </method>
  21660. <method name="getProgress" return="float"
  21661. abstract="false" native="false" synchronized="false"
  21662. static="false" final="false" visibility="public"
  21663. deprecated="not deprecated">
  21664. <exception name="IOException" type="java.io.IOException"/>
  21665. </method>
  21666. <method name="close"
  21667. abstract="false" native="false" synchronized="true"
  21668. static="false" final="false" visibility="public"
  21669. deprecated="not deprecated">
  21670. <exception name="IOException" type="java.io.IOException"/>
  21671. </method>
  21672. <field name="KEY_VALUE_SEPERATOR" type="java.lang.String"
  21673. transient="false" volatile="false"
  21674. static="true" final="true" visibility="public"
  21675. deprecated="not deprecated">
  21676. </field>
  21677. <doc>
  21678. <![CDATA[This class treats a line in the input as a key/value pair separated by a
  21679. separator character. The separator can be specified in config file
  21680. under the attribute name mapreduce.input.keyvaluelinerecordreader.key.value.separator. The default
  21681. separator is the tab character ('\t').]]>
  21682. </doc>
  21683. </class>
  21684. <!-- end class org.apache.hadoop.mapreduce.lib.input.KeyValueLineRecordReader -->
  21685. <!-- start class org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat -->
  21686. <class name="KeyValueTextInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.FileInputFormat"
  21687. abstract="false"
  21688. static="false" final="false" visibility="public"
  21689. deprecated="not deprecated">
  21690. <constructor name="KeyValueTextInputFormat"
  21691. static="false" final="false" visibility="public"
  21692. deprecated="not deprecated">
  21693. </constructor>
  21694. <method name="isSplitable" return="boolean"
  21695. abstract="false" native="false" synchronized="false"
  21696. static="false" final="false" visibility="protected"
  21697. deprecated="not deprecated">
  21698. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  21699. <param name="file" type="org.apache.hadoop.fs.Path"/>
  21700. </method>
  21701. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  21702. abstract="false" native="false" synchronized="false"
  21703. static="false" final="false" visibility="public"
  21704. deprecated="not deprecated">
  21705. <param name="genericSplit" type="org.apache.hadoop.mapreduce.InputSplit"/>
  21706. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  21707. <exception name="IOException" type="java.io.IOException"/>
  21708. </method>
  21709. <doc>
  21710. <![CDATA[An {@link InputFormat} for plain text files. Files are broken into lines.
  21711. Either a line feed or a carriage return is used to signal the end of a line.
  21712. Each line is divided into key and value parts by a separator byte. If no
  21713. such byte exists, the key will be the entire line and the value will be empty.]]>
  21714. </doc>
  21715. </class>
  21716. <!-- end class org.apache.hadoop.mapreduce.lib.input.KeyValueTextInputFormat -->
  21717. <!-- start class org.apache.hadoop.mapreduce.lib.input.MultipleInputs -->
  21718. <class name="MultipleInputs" extends="java.lang.Object"
  21719. abstract="false"
  21720. static="false" final="false" visibility="public"
  21721. deprecated="not deprecated">
  21722. <constructor name="MultipleInputs"
  21723. static="false" final="false" visibility="public"
  21724. deprecated="not deprecated">
  21725. </constructor>
  21726. <method name="addInputPath"
  21727. abstract="false" native="false" synchronized="false"
  21728. static="true" final="false" visibility="public"
  21729. deprecated="not deprecated">
  21730. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21731. <param name="path" type="org.apache.hadoop.fs.Path"/>
  21732. <param name="inputFormatClass" type="java.lang.Class"/>
  21733. <doc>
  21734. <![CDATA[Add a {@link Path} with a custom {@link InputFormat} to the list of
  21735. inputs for the map-reduce job.
  21736. @param job The {@link Job}
  21737. @param path {@link Path} to be added to the list of inputs for the job
  21738. @param inputFormatClass {@link InputFormat} class to use for this path]]>
  21739. </doc>
  21740. </method>
  21741. <method name="addInputPath"
  21742. abstract="false" native="false" synchronized="false"
  21743. static="true" final="false" visibility="public"
  21744. deprecated="not deprecated">
  21745. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21746. <param name="path" type="org.apache.hadoop.fs.Path"/>
  21747. <param name="inputFormatClass" type="java.lang.Class"/>
  21748. <param name="mapperClass" type="java.lang.Class"/>
  21749. <doc>
  21750. <![CDATA[Add a {@link Path} with a custom {@link InputFormat} and
  21751. {@link Mapper} to the list of inputs for the map-reduce job.
  21752. @param job The {@link Job}
  21753. @param path {@link Path} to be added to the list of inputs for the job
  21754. @param inputFormatClass {@link InputFormat} class to use for this path
  21755. @param mapperClass {@link Mapper} class to use for this path]]>
  21756. </doc>
  21757. </method>
  21758. <field name="DIR_FORMATS" type="java.lang.String"
  21759. transient="false" volatile="false"
  21760. static="true" final="true" visibility="public"
  21761. deprecated="not deprecated">
  21762. </field>
  21763. <field name="DIR_MAPPERS" type="java.lang.String"
  21764. transient="false" volatile="false"
  21765. static="true" final="true" visibility="public"
  21766. deprecated="not deprecated">
  21767. </field>
  21768. <doc>
  21769. <![CDATA[This class supports MapReduce jobs that have multiple input paths with
  21770. a different {@link InputFormat} and {@link Mapper} for each path.]]>
  21771. </doc>
  21772. </class>
  21773. <!-- end class org.apache.hadoop.mapreduce.lib.input.MultipleInputs -->
  21774. <!-- start class org.apache.hadoop.mapreduce.lib.input.NLineInputFormat -->
  21775. <class name="NLineInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.FileInputFormat"
  21776. abstract="false"
  21777. static="false" final="false" visibility="public"
  21778. deprecated="not deprecated">
  21779. <constructor name="NLineInputFormat"
  21780. static="false" final="false" visibility="public"
  21781. deprecated="not deprecated">
  21782. </constructor>
  21783. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  21784. abstract="false" native="false" synchronized="false"
  21785. static="false" final="false" visibility="public"
  21786. deprecated="not deprecated">
  21787. <param name="genericSplit" type="org.apache.hadoop.mapreduce.InputSplit"/>
  21788. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  21789. <exception name="IOException" type="java.io.IOException"/>
  21790. </method>
  21791. <method name="getSplits" return="java.util.List"
  21792. abstract="false" native="false" synchronized="false"
  21793. static="false" final="false" visibility="public"
  21794. deprecated="not deprecated">
  21795. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  21796. <exception name="IOException" type="java.io.IOException"/>
  21797. <doc>
  21798. <![CDATA[Logically splits the set of input files for the job, treating every
  21799. N lines of the input as one split.
  21800. @see FileInputFormat#getSplits(JobContext)]]>
  21801. </doc>
  21802. </method>
  21803. <method name="getSplitsForFile" return="java.util.List"
  21804. abstract="false" native="false" synchronized="false"
  21805. static="true" final="false" visibility="public"
  21806. deprecated="not deprecated">
  21807. <param name="status" type="org.apache.hadoop.fs.FileStatus"/>
  21808. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  21809. <param name="numLinesPerSplit" type="int"/>
  21810. <exception name="IOException" type="java.io.IOException"/>
  21811. </method>
  21812. <method name="setNumLinesPerSplit"
  21813. abstract="false" native="false" synchronized="false"
  21814. static="true" final="false" visibility="public"
  21815. deprecated="not deprecated">
  21816. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  21817. <param name="numLines" type="int"/>
  21818. <doc>
  21819. <![CDATA[Set the number of lines per split
  21820. @param job the job to modify
  21821. @param numLines the number of lines per split]]>
  21822. </doc>
  21823. </method>
  21824. <method name="getNumLinesPerSplit" return="int"
  21825. abstract="false" native="false" synchronized="false"
  21826. static="true" final="false" visibility="public"
  21827. deprecated="not deprecated">
  21828. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  21829. <doc>
  21830. <![CDATA[Get the number of lines per split
  21831. @param job the job
  21832. @return the number of lines per split]]>
  21833. </doc>
  21834. </method>
  21835. <field name="LINES_PER_MAP" type="java.lang.String"
  21836. transient="false" volatile="false"
  21837. static="true" final="true" visibility="public"
  21838. deprecated="not deprecated">
  21839. </field>
  21840. <doc>
  21841. <![CDATA[NLineInputFormat which splits N lines of input as one split.
  21842. In many "pleasantly" parallel applications, each process/mapper
  21843. processes the same input file(s), but with computations that are
  21844. controlled by different parameters (referred to as "parameter sweeps").
  21845. One way to achieve this is to specify a set of parameters
  21846. (one set per line) as input in a control file
  21847. (which is the input path to the map-reduce application,
  21848. whereas the input dataset is specified
  21849. via a config variable in JobConf).
  21850. The NLineInputFormat can be used in such applications: it splits
  21851. the input file such that, by default, one line is fed as
  21852. a value to one map task, and the key is the offset,
  21853. i.e. (k,v) is (LongWritable, Text).
  21854. The location hints will span the whole mapred cluster.]]>
  21855. </doc>
  21856. </class>
  21857. <!-- end class org.apache.hadoop.mapreduce.lib.input.NLineInputFormat -->
  21858. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsBinaryInputFormat -->
  21859. <class name="SequenceFileAsBinaryInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat"
  21860. abstract="false"
  21861. static="false" final="false" visibility="public"
  21862. deprecated="not deprecated">
  21863. <constructor name="SequenceFileAsBinaryInputFormat"
  21864. static="false" final="false" visibility="public"
  21865. deprecated="not deprecated">
  21866. </constructor>
  21867. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  21868. abstract="false" native="false" synchronized="false"
  21869. static="false" final="false" visibility="public"
  21870. deprecated="not deprecated">
  21871. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  21872. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  21873. <exception name="IOException" type="java.io.IOException"/>
  21874. </method>
  21875. <doc>
  21876. <![CDATA[InputFormat reading keys, values from SequenceFiles in binary (raw)
  21877. format.]]>
  21878. </doc>
  21879. </class>
  21880. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsBinaryInputFormat -->
  21881. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader -->
  21882. <class name="SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  21883. abstract="false"
  21884. static="true" final="false" visibility="public"
  21885. deprecated="not deprecated">
  21886. <constructor name="SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader"
  21887. static="false" final="false" visibility="public"
  21888. deprecated="not deprecated">
  21889. </constructor>
  21890. <method name="initialize"
  21891. abstract="false" native="false" synchronized="false"
  21892. static="false" final="false" visibility="public"
  21893. deprecated="not deprecated">
  21894. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  21895. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  21896. <exception name="IOException" type="java.io.IOException"/>
  21897. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21898. </method>
  21899. <method name="getCurrentKey" return="org.apache.hadoop.io.BytesWritable"
  21900. abstract="false" native="false" synchronized="false"
  21901. static="false" final="false" visibility="public"
  21902. deprecated="not deprecated">
  21903. <exception name="IOException" type="java.io.IOException"/>
  21904. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21905. </method>
  21906. <method name="getCurrentValue" return="org.apache.hadoop.io.BytesWritable"
  21907. abstract="false" native="false" synchronized="false"
  21908. static="false" final="false" visibility="public"
  21909. deprecated="not deprecated">
  21910. <exception name="IOException" type="java.io.IOException"/>
  21911. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21912. </method>
  21913. <method name="getKeyClassName" return="java.lang.String"
  21914. abstract="false" native="false" synchronized="false"
  21915. static="false" final="false" visibility="public"
  21916. deprecated="not deprecated">
  21917. <doc>
  21918. <![CDATA[Retrieve the name of the key class for this SequenceFile.
  21919. @see org.apache.hadoop.io.SequenceFile.Reader#getKeyClassName]]>
  21920. </doc>
  21921. </method>
  21922. <method name="getValueClassName" return="java.lang.String"
  21923. abstract="false" native="false" synchronized="false"
  21924. static="false" final="false" visibility="public"
  21925. deprecated="not deprecated">
  21926. <doc>
  21927. <![CDATA[Retrieve the name of the value class for this SequenceFile.
  21928. @see org.apache.hadoop.io.SequenceFile.Reader#getValueClassName]]>
  21929. </doc>
  21930. </method>
  21931. <method name="nextKeyValue" return="boolean"
  21932. abstract="false" native="false" synchronized="true"
  21933. static="false" final="false" visibility="public"
  21934. deprecated="not deprecated">
  21935. <exception name="IOException" type="java.io.IOException"/>
  21936. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21937. <doc>
  21938. <![CDATA[Read raw bytes from a SequenceFile.]]>
  21939. </doc>
  21940. </method>
  21941. <method name="close"
  21942. abstract="false" native="false" synchronized="false"
  21943. static="false" final="false" visibility="public"
  21944. deprecated="not deprecated">
  21945. <exception name="IOException" type="java.io.IOException"/>
  21946. </method>
  21947. <method name="getProgress" return="float"
  21948. abstract="false" native="false" synchronized="false"
  21949. static="false" final="false" visibility="public"
  21950. deprecated="not deprecated">
  21951. <exception name="IOException" type="java.io.IOException"/>
  21952. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  21953. <doc>
  21954. <![CDATA[Return the progress within the input split
  21955. @return 0.0 to 1.0 of the input byte range]]>
  21956. </doc>
  21957. </method>
  21958. <doc>
  21959. <![CDATA[Read records from a SequenceFile as binary (raw) bytes.]]>
  21960. </doc>
  21961. </class>
  21962. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsBinaryInputFormat.SequenceFileAsBinaryRecordReader -->
  21963. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextInputFormat -->
  21964. <class name="SequenceFileAsTextInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat"
  21965. abstract="false"
  21966. static="false" final="false" visibility="public"
  21967. deprecated="not deprecated">
  21968. <constructor name="SequenceFileAsTextInputFormat"
  21969. static="false" final="false" visibility="public"
  21970. deprecated="not deprecated">
  21971. </constructor>
  21972. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  21973. abstract="false" native="false" synchronized="false"
  21974. static="false" final="false" visibility="public"
  21975. deprecated="not deprecated">
  21976. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  21977. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  21978. <exception name="IOException" type="java.io.IOException"/>
  21979. </method>
  21980. <doc>
  21981. <![CDATA[This class is similar to SequenceFileInputFormat, except it generates
  21982. SequenceFileAsTextRecordReader which converts the input keys and values
  21983. to their String forms by calling their toString() method.]]>
  21984. </doc>
  21985. </class>
  21986. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextInputFormat -->
  21987. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextRecordReader -->
  21988. <class name="SequenceFileAsTextRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  21989. abstract="false"
  21990. static="false" final="false" visibility="public"
  21991. deprecated="not deprecated">
  21992. <constructor name="SequenceFileAsTextRecordReader"
  21993. static="false" final="false" visibility="public"
  21994. deprecated="not deprecated">
  21995. <exception name="IOException" type="java.io.IOException"/>
  21996. </constructor>
  21997. <method name="initialize"
  21998. abstract="false" native="false" synchronized="false"
  21999. static="false" final="false" visibility="public"
  22000. deprecated="not deprecated">
  22001. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22002. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22003. <exception name="IOException" type="java.io.IOException"/>
  22004. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22005. </method>
  22006. <method name="getCurrentKey" return="org.apache.hadoop.io.Text"
  22007. abstract="false" native="false" synchronized="false"
  22008. static="false" final="false" visibility="public"
  22009. deprecated="not deprecated">
  22010. <exception name="IOException" type="java.io.IOException"/>
  22011. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22012. </method>
  22013. <method name="getCurrentValue" return="org.apache.hadoop.io.Text"
  22014. abstract="false" native="false" synchronized="false"
  22015. static="false" final="false" visibility="public"
  22016. deprecated="not deprecated">
  22017. <exception name="IOException" type="java.io.IOException"/>
  22018. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22019. </method>
  22020. <method name="nextKeyValue" return="boolean"
  22021. abstract="false" native="false" synchronized="true"
  22022. static="false" final="false" visibility="public"
  22023. deprecated="not deprecated">
  22024. <exception name="IOException" type="java.io.IOException"/>
  22025. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22026. <doc>
  22027. <![CDATA[Read key/value pair in a line.]]>
  22028. </doc>
  22029. </method>
  22030. <method name="getProgress" return="float"
  22031. abstract="false" native="false" synchronized="false"
  22032. static="false" final="false" visibility="public"
  22033. deprecated="not deprecated">
  22034. <exception name="IOException" type="java.io.IOException"/>
  22035. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22036. </method>
  22037. <method name="close"
  22038. abstract="false" native="false" synchronized="true"
  22039. static="false" final="false" visibility="public"
  22040. deprecated="not deprecated">
  22041. <exception name="IOException" type="java.io.IOException"/>
  22042. </method>
  22043. <doc>
  22044. <![CDATA[This class converts the input keys and values to their String forms by
  22045. calling toString() method. This class to SequenceFileAsTextInputFormat
  22046. class is as LineRecordReader class to TextInputFormat class.]]>
  22047. </doc>
  22048. </class>
  22049. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileAsTextRecordReader -->
  22050. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter -->
  22051. <class name="SequenceFileInputFilter" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat"
  22052. abstract="false"
  22053. static="false" final="false" visibility="public"
  22054. deprecated="not deprecated">
  22055. <constructor name="SequenceFileInputFilter"
  22056. static="false" final="false" visibility="public"
  22057. deprecated="not deprecated">
  22058. </constructor>
  22059. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  22060. abstract="false" native="false" synchronized="false"
  22061. static="false" final="false" visibility="public"
  22062. deprecated="not deprecated">
  22063. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22064. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22065. <exception name="IOException" type="java.io.IOException"/>
  22066. <doc>
  22067. <![CDATA[Create a record reader for the given split
  22068. @param split file split
  22069. @param context the task-attempt context
  22070. @return RecordReader]]>
  22071. </doc>
  22072. </method>
  22073. <method name="setFilterClass"
  22074. abstract="false" native="false" synchronized="false"
  22075. static="true" final="false" visibility="public"
  22076. deprecated="not deprecated">
  22077. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  22078. <param name="filterClass" type="java.lang.Class"/>
  22079. <doc>
  22080. <![CDATA[set the filter class
  22081. @param job The job
  22082. @param filterClass filter class]]>
  22083. </doc>
  22084. </method>
  22085. <field name="LOG" type="org.apache.commons.logging.Log"
  22086. transient="false" volatile="false"
  22087. static="true" final="true" visibility="public"
  22088. deprecated="not deprecated">
  22089. </field>
  22090. <field name="FILTER_CLASS" type="java.lang.String"
  22091. transient="false" volatile="false"
  22092. static="true" final="true" visibility="public"
  22093. deprecated="not deprecated">
  22094. </field>
  22095. <field name="FILTER_FREQUENCY" type="java.lang.String"
  22096. transient="false" volatile="false"
  22097. static="true" final="true" visibility="public"
  22098. deprecated="not deprecated">
  22099. </field>
  22100. <field name="FILTER_REGEX" type="java.lang.String"
  22101. transient="false" volatile="false"
  22102. static="true" final="true" visibility="public"
  22103. deprecated="not deprecated">
  22104. </field>
  22105. <doc>
  22106. <![CDATA[A class that allows a map/red job to work on a sample of sequence files.
  22107. The sample is decided by the filter class set by the job.]]>
  22108. </doc>
  22109. </class>
  22110. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter -->
  22111. <!-- start interface org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.Filter -->
  22112. <interface name="SequenceFileInputFilter.Filter" abstract="true"
  22113. static="true" final="false" visibility="public"
  22114. deprecated="not deprecated">
  22115. <implements name="org.apache.hadoop.conf.Configurable"/>
  22116. <method name="accept" return="boolean"
  22117. abstract="false" native="false" synchronized="false"
  22118. static="false" final="false" visibility="public"
  22119. deprecated="not deprecated">
  22120. <param name="key" type="java.lang.Object"/>
  22121. <doc>
  22122. <![CDATA[filter function
  22123. Decide if a record should be filtered or not
  22124. @param key record key
  22125. @return true if a record is accepted; return false otherwise]]>
  22126. </doc>
  22127. </method>
  22128. <doc>
  22129. <![CDATA[filter interface]]>
  22130. </doc>
  22131. </interface>
  22132. <!-- end interface org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.Filter -->
  22133. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.FilterBase -->
  22134. <class name="SequenceFileInputFilter.FilterBase" extends="java.lang.Object"
  22135. abstract="true"
  22136. static="true" final="false" visibility="public"
  22137. deprecated="not deprecated">
  22138. <implements name="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.Filter"/>
  22139. <constructor name="SequenceFileInputFilter.FilterBase"
  22140. static="false" final="false" visibility="public"
  22141. deprecated="not deprecated">
  22142. </constructor>
  22143. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  22144. abstract="false" native="false" synchronized="false"
  22145. static="false" final="false" visibility="public"
  22146. deprecated="not deprecated">
  22147. </method>
  22148. <doc>
  22149. <![CDATA[base class for Filters]]>
  22150. </doc>
  22151. </class>
  22152. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.FilterBase -->
  22153. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.MD5Filter -->
  22154. <class name="SequenceFileInputFilter.MD5Filter" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.FilterBase"
  22155. abstract="false"
  22156. static="true" final="false" visibility="public"
  22157. deprecated="not deprecated">
  22158. <constructor name="SequenceFileInputFilter.MD5Filter"
  22159. static="false" final="false" visibility="public"
  22160. deprecated="not deprecated">
  22161. </constructor>
  22162. <method name="setFrequency"
  22163. abstract="false" native="false" synchronized="false"
  22164. static="true" final="false" visibility="public"
  22165. deprecated="not deprecated">
  22166. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22167. <param name="frequency" type="int"/>
  22168. <doc>
  22169. <![CDATA[set the filtering frequency in configuration
  22170. @param conf configuration
  22171. @param frequency filtering frequency]]>
  22172. </doc>
  22173. </method>
  22174. <method name="setConf"
  22175. abstract="false" native="false" synchronized="false"
  22176. static="false" final="false" visibility="public"
  22177. deprecated="not deprecated">
  22178. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22179. <doc>
  22180. <![CDATA[configure the filter according to configuration
  22181. @param conf configuration]]>
  22182. </doc>
  22183. </method>
  22184. <method name="accept" return="boolean"
  22185. abstract="false" native="false" synchronized="false"
  22186. static="false" final="false" visibility="public"
  22187. deprecated="not deprecated">
  22188. <param name="key" type="java.lang.Object"/>
  22189. <doc>
  22190. <![CDATA[Filtering method
  22191. If MD5(key) % frequency==0, return true; otherwise return false
  22192. @see Filter#accept(Object)]]>
  22193. </doc>
  22194. </method>
  22195. <field name="MD5_LEN" type="int"
  22196. transient="false" volatile="false"
  22197. static="true" final="true" visibility="public"
  22198. deprecated="not deprecated">
  22199. </field>
  22200. <doc>
  22201. <![CDATA[This class returns a set of records by examining the MD5 digest of its
  22202. key against a filtering frequency <i>f</i>. The filtering criterion is
  22203. MD5(key) % f == 0.]]>
  22204. </doc>
  22205. </class>
  22206. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.MD5Filter -->
  22207. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.PercentFilter -->
  22208. <class name="SequenceFileInputFilter.PercentFilter" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.FilterBase"
  22209. abstract="false"
  22210. static="true" final="false" visibility="public"
  22211. deprecated="not deprecated">
  22212. <constructor name="SequenceFileInputFilter.PercentFilter"
  22213. static="false" final="false" visibility="public"
  22214. deprecated="not deprecated">
  22215. </constructor>
  22216. <method name="setFrequency"
  22217. abstract="false" native="false" synchronized="false"
  22218. static="true" final="false" visibility="public"
  22219. deprecated="not deprecated">
  22220. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22221. <param name="frequency" type="int"/>
  22222. <doc>
  22223. <![CDATA[set the frequency and stores it in conf
  22224. @param conf configuration
  22225. @param frequency filtering frequency]]>
  22226. </doc>
  22227. </method>
  22228. <method name="setConf"
  22229. abstract="false" native="false" synchronized="false"
  22230. static="false" final="false" visibility="public"
  22231. deprecated="not deprecated">
  22232. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22233. <doc>
  22234. <![CDATA[configure the filter by checking the configuration
  22235. @param conf configuration]]>
  22236. </doc>
  22237. </method>
  22238. <method name="accept" return="boolean"
  22239. abstract="false" native="false" synchronized="false"
  22240. static="false" final="false" visibility="public"
  22241. deprecated="not deprecated">
  22242. <param name="key" type="java.lang.Object"/>
  22243. <doc>
  22244. <![CDATA[Filtering method
  22245. If record# % frequency==0, return true; otherwise return false
  22246. @see Filter#accept(Object)]]>
  22247. </doc>
  22248. </method>
  22249. <doc>
  22250. <![CDATA[This class returns a percentage of records
  22251. The percentage is determined by a filtering frequency <i>f</i> using
  22252. the criteria record# % f == 0.
  22253. For example, if the frequency is 10, one out of 10 records is returned.]]>
  22254. </doc>
  22255. </class>
  22256. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.PercentFilter -->
  22257. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.RegexFilter -->
  22258. <class name="SequenceFileInputFilter.RegexFilter" extends="org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.FilterBase"
  22259. abstract="false"
  22260. static="true" final="false" visibility="public"
  22261. deprecated="not deprecated">
  22262. <constructor name="SequenceFileInputFilter.RegexFilter"
  22263. static="false" final="false" visibility="public"
  22264. deprecated="not deprecated">
  22265. </constructor>
  22266. <method name="setPattern"
  22267. abstract="false" native="false" synchronized="false"
  22268. static="true" final="false" visibility="public"
  22269. deprecated="not deprecated">
  22270. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22271. <param name="regex" type="java.lang.String"/>
  22272. <exception name="PatternSyntaxException" type="java.util.regex.PatternSyntaxException"/>
  22273. <doc>
  22274. <![CDATA[Define the filtering regex and stores it in conf
  22275. @param conf where the regex is set
  22276. @param regex regex used as a filter]]>
  22277. </doc>
  22278. </method>
  22279. <method name="setConf"
  22280. abstract="false" native="false" synchronized="false"
  22281. static="false" final="false" visibility="public"
  22282. deprecated="not deprecated">
  22283. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22284. <doc>
  22285. <![CDATA[configure the Filter by checking the configuration]]>
  22286. </doc>
  22287. </method>
  22288. <method name="accept" return="boolean"
  22289. abstract="false" native="false" synchronized="false"
  22290. static="false" final="false" visibility="public"
  22291. deprecated="not deprecated">
  22292. <param name="key" type="java.lang.Object"/>
  22293. <doc>
  22294. <![CDATA[Filtering method
  22295. If key matches the regex, return true; otherwise return false
  22296. @see Filter#accept(Object)]]>
  22297. </doc>
  22298. </method>
  22299. <doc>
  22300. <![CDATA[Records filter by matching key to regex]]>
  22301. </doc>
  22302. </class>
  22303. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFilter.RegexFilter -->
  22304. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat -->
  22305. <class name="SequenceFileInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.FileInputFormat"
  22306. abstract="false"
  22307. static="false" final="false" visibility="public"
  22308. deprecated="not deprecated">
  22309. <constructor name="SequenceFileInputFormat"
  22310. static="false" final="false" visibility="public"
  22311. deprecated="not deprecated">
  22312. </constructor>
  22313. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  22314. abstract="false" native="false" synchronized="false"
  22315. static="false" final="false" visibility="public"
  22316. deprecated="not deprecated">
  22317. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22318. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22319. <exception name="IOException" type="java.io.IOException"/>
  22320. </method>
  22321. <method name="getFormatMinSplitSize" return="long"
  22322. abstract="false" native="false" synchronized="false"
  22323. static="false" final="false" visibility="protected"
  22324. deprecated="not deprecated">
  22325. </method>
  22326. <method name="listStatus" return="java.util.List"
  22327. abstract="false" native="false" synchronized="false"
  22328. static="false" final="false" visibility="protected"
  22329. deprecated="not deprecated">
  22330. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  22331. <exception name="IOException" type="java.io.IOException"/>
  22332. </method>
  22333. <doc>
  22334. <![CDATA[An {@link InputFormat} for {@link SequenceFile}s.]]>
  22335. </doc>
  22336. </class>
  22337. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileInputFormat -->
  22338. <!-- start class org.apache.hadoop.mapreduce.lib.input.SequenceFileRecordReader -->
  22339. <class name="SequenceFileRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  22340. abstract="false"
  22341. static="false" final="false" visibility="public"
  22342. deprecated="not deprecated">
  22343. <constructor name="SequenceFileRecordReader"
  22344. static="false" final="false" visibility="public"
  22345. deprecated="not deprecated">
  22346. </constructor>
  22347. <method name="initialize"
  22348. abstract="false" native="false" synchronized="false"
  22349. static="false" final="false" visibility="public"
  22350. deprecated="not deprecated">
  22351. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22352. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22353. <exception name="IOException" type="java.io.IOException"/>
  22354. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22355. </method>
  22356. <method name="nextKeyValue" return="boolean"
  22357. abstract="false" native="false" synchronized="false"
  22358. static="false" final="false" visibility="public"
  22359. deprecated="not deprecated">
  22360. <exception name="IOException" type="java.io.IOException"/>
  22361. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22362. </method>
  22363. <method name="getCurrentKey" return="K"
  22364. abstract="false" native="false" synchronized="false"
  22365. static="false" final="false" visibility="public"
  22366. deprecated="not deprecated">
  22367. </method>
  22368. <method name="getCurrentValue" return="V"
  22369. abstract="false" native="false" synchronized="false"
  22370. static="false" final="false" visibility="public"
  22371. deprecated="not deprecated">
  22372. </method>
  22373. <method name="getProgress" return="float"
  22374. abstract="false" native="false" synchronized="false"
  22375. static="false" final="false" visibility="public"
  22376. deprecated="not deprecated">
  22377. <exception name="IOException" type="java.io.IOException"/>
  22378. <doc>
  22379. <![CDATA[Return the progress within the input split
  22380. @return 0.0 to 1.0 of the input byte range]]>
  22381. </doc>
  22382. </method>
  22383. <method name="close"
  22384. abstract="false" native="false" synchronized="true"
  22385. static="false" final="false" visibility="public"
  22386. deprecated="not deprecated">
  22387. <exception name="IOException" type="java.io.IOException"/>
  22388. </method>
  22389. <field name="conf" type="org.apache.hadoop.conf.Configuration"
  22390. transient="false" volatile="false"
  22391. static="false" final="false" visibility="protected"
  22392. deprecated="not deprecated">
  22393. </field>
  22394. <doc>
  22395. <![CDATA[A {@link RecordReader} for {@link SequenceFile}s.]]>
  22396. </doc>
  22397. </class>
  22398. <!-- end class org.apache.hadoop.mapreduce.lib.input.SequenceFileRecordReader -->
  22399. <!-- start class org.apache.hadoop.mapreduce.lib.input.TextInputFormat -->
  22400. <class name="TextInputFormat" extends="org.apache.hadoop.mapreduce.lib.input.FileInputFormat"
  22401. abstract="false"
  22402. static="false" final="false" visibility="public"
  22403. deprecated="not deprecated">
  22404. <constructor name="TextInputFormat"
  22405. static="false" final="false" visibility="public"
  22406. deprecated="not deprecated">
  22407. </constructor>
  22408. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  22409. abstract="false" native="false" synchronized="false"
  22410. static="false" final="false" visibility="public"
  22411. deprecated="not deprecated">
  22412. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22413. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22414. </method>
  22415. <method name="isSplitable" return="boolean"
  22416. abstract="false" native="false" synchronized="false"
  22417. static="false" final="false" visibility="protected"
  22418. deprecated="not deprecated">
  22419. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  22420. <param name="file" type="org.apache.hadoop.fs.Path"/>
  22421. </method>
  22422. <doc>
  22423. <![CDATA[An {@link InputFormat} for plain text files. Files are broken into lines.
  22424. Either linefeed or carriage-return is used to signal end of line. Keys are
  22425. the position in the file, and values are the line of text.]]>
  22426. </doc>
  22427. </class>
  22428. <!-- end class org.apache.hadoop.mapreduce.lib.input.TextInputFormat -->
  22429. </package>
  22430. <package name="org.apache.hadoop.mapreduce.lib.jobcontrol">
  22431. <!-- start class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob -->
  22432. <class name="ControlledJob" extends="java.lang.Object"
  22433. abstract="false"
  22434. static="false" final="false" visibility="public"
  22435. deprecated="not deprecated">
  22436. <constructor name="ControlledJob" type="org.apache.hadoop.mapreduce.Job, java.util.List"
  22437. static="false" final="false" visibility="public"
  22438. deprecated="not deprecated">
  22439. <exception name="IOException" type="java.io.IOException"/>
  22440. <doc>
  22441. <![CDATA[Construct a job.
  22442. @param job a mapreduce job to be executed.
  22443. @param dependingJobs a list of jobs the current job depends on]]>
  22444. </doc>
  22445. </constructor>
  22446. <constructor name="ControlledJob" type="org.apache.hadoop.conf.Configuration"
  22447. static="false" final="false" visibility="public"
  22448. deprecated="not deprecated">
  22449. <exception name="IOException" type="java.io.IOException"/>
  22450. <doc>
  22451. <![CDATA[Construct a job.
  22452. @param conf mapred job configuration representing a job to be executed.
  22453. @throws IOException]]>
  22454. </doc>
  22455. </constructor>
  22456. <method name="toString" return="java.lang.String"
  22457. abstract="false" native="false" synchronized="false"
  22458. static="false" final="false" visibility="public"
  22459. deprecated="not deprecated">
  22460. </method>
  22461. <method name="getJobName" return="java.lang.String"
  22462. abstract="false" native="false" synchronized="false"
  22463. static="false" final="false" visibility="public"
  22464. deprecated="not deprecated">
  22465. <doc>
  22466. <![CDATA[@return the job name of this job]]>
  22467. </doc>
  22468. </method>
  22469. <method name="setJobName"
  22470. abstract="false" native="false" synchronized="false"
  22471. static="false" final="false" visibility="public"
  22472. deprecated="not deprecated">
  22473. <param name="jobName" type="java.lang.String"/>
  22474. <doc>
  22475. <![CDATA[Set the job name for this job.
  22476. @param jobName the job name]]>
  22477. </doc>
  22478. </method>
  22479. <method name="getJobID" return="java.lang.String"
  22480. abstract="false" native="false" synchronized="false"
  22481. static="false" final="false" visibility="public"
  22482. deprecated="not deprecated">
  22483. <doc>
  22484. <![CDATA[@return the job ID of this job assigned by JobControl]]>
  22485. </doc>
  22486. </method>
  22487. <method name="setJobID"
  22488. abstract="false" native="false" synchronized="false"
  22489. static="false" final="false" visibility="public"
  22490. deprecated="not deprecated">
  22491. <param name="id" type="java.lang.String"/>
  22492. <doc>
  22493. <![CDATA[Set the job ID for this job.
  22494. @param id the job ID]]>
  22495. </doc>
  22496. </method>
  22497. <method name="getMapredJobID" return="org.apache.hadoop.mapreduce.JobID"
  22498. abstract="false" native="false" synchronized="false"
  22499. static="false" final="false" visibility="public"
  22500. deprecated="not deprecated">
  22501. <doc>
  22502. <![CDATA[@return the mapred ID of this job as assigned by the
  22503. mapred framework.]]>
  22504. </doc>
  22505. </method>
  22506. <method name="getJob" return="org.apache.hadoop.mapreduce.Job"
  22507. abstract="false" native="false" synchronized="true"
  22508. static="false" final="false" visibility="public"
  22509. deprecated="not deprecated">
  22510. <doc>
  22511. <![CDATA[@return the mapreduce job]]>
  22512. </doc>
  22513. </method>
  22514. <method name="setJob"
  22515. abstract="false" native="false" synchronized="true"
  22516. static="false" final="false" visibility="public"
  22517. deprecated="not deprecated">
  22518. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  22519. <doc>
  22520. <![CDATA[Set the mapreduce job
  22521. @param job the mapreduce job for this job.]]>
  22522. </doc>
  22523. </method>
  22524. <method name="getJobState" return="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State"
  22525. abstract="false" native="false" synchronized="true"
  22526. static="false" final="false" visibility="public"
  22527. deprecated="not deprecated">
  22528. <doc>
  22529. <![CDATA[@return the state of this job]]>
  22530. </doc>
  22531. </method>
  22532. <method name="setJobState"
  22533. abstract="false" native="false" synchronized="true"
  22534. static="false" final="false" visibility="protected"
  22535. deprecated="not deprecated">
  22536. <param name="state" type="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State"/>
  22537. <doc>
  22538. <![CDATA[Set the state for this job.
  22539. @param state the new state for this job.]]>
  22540. </doc>
  22541. </method>
  22542. <method name="getMessage" return="java.lang.String"
  22543. abstract="false" native="false" synchronized="true"
  22544. static="false" final="false" visibility="public"
  22545. deprecated="not deprecated">
  22546. <doc>
  22547. <![CDATA[@return the message of this job]]>
  22548. </doc>
  22549. </method>
  22550. <method name="setMessage"
  22551. abstract="false" native="false" synchronized="true"
  22552. static="false" final="false" visibility="public"
  22553. deprecated="not deprecated">
  22554. <param name="message" type="java.lang.String"/>
  22555. <doc>
  22556. <![CDATA[Set the message for this job.
  22557. @param message the message for this job.]]>
  22558. </doc>
  22559. </method>
  22560. <method name="getDependentJobs" return="java.util.List"
  22561. abstract="false" native="false" synchronized="false"
  22562. static="false" final="false" visibility="public"
  22563. deprecated="not deprecated">
  22564. <doc>
  22565. <![CDATA[@return the depending jobs of this job]]>
  22566. </doc>
  22567. </method>
  22568. <method name="addDependingJob" return="boolean"
  22569. abstract="false" native="false" synchronized="true"
  22570. static="false" final="false" visibility="public"
  22571. deprecated="not deprecated">
  22572. <param name="dependingJob" type="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob"/>
  22573. <doc>
  22574. <![CDATA[Add a job to this job's dependency list.
  22575. Dependent jobs can only be added while a Job
  22576. is waiting to run, not during or afterwards.
  22577. @param dependingJob Job that this Job depends on.
  22578. @return <tt>true</tt> if the Job was added.]]>
  22579. </doc>
  22580. </method>
  22581. <method name="isCompleted" return="boolean"
  22582. abstract="false" native="false" synchronized="true"
  22583. static="false" final="false" visibility="public"
  22584. deprecated="not deprecated">
  22585. <doc>
  22586. <![CDATA[@return true if this job is in a complete state]]>
  22587. </doc>
  22588. </method>
  22589. <method name="isReady" return="boolean"
  22590. abstract="false" native="false" synchronized="true"
  22591. static="false" final="false" visibility="public"
  22592. deprecated="not deprecated">
  22593. <doc>
  22594. <![CDATA[@return true if this job is in READY state]]>
  22595. </doc>
  22596. </method>
  22597. <method name="killJob"
  22598. abstract="false" native="false" synchronized="false"
  22599. static="false" final="false" visibility="public"
  22600. deprecated="not deprecated">
  22601. <exception name="IOException" type="java.io.IOException"/>
  22602. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22603. </method>
  22604. <method name="submit"
  22605. abstract="false" native="false" synchronized="true"
  22606. static="false" final="false" visibility="protected"
  22607. deprecated="not deprecated">
  22608. <doc>
  22609. <![CDATA[Submit this job to mapred. The state becomes RUNNING if submission
  22610. is successful, FAILED otherwise.]]>
  22611. </doc>
  22612. </method>
  22613. <field name="CREATE_DIR" type="java.lang.String"
  22614. transient="false" volatile="false"
  22615. static="true" final="true" visibility="public"
  22616. deprecated="not deprecated">
  22617. </field>
  22618. <doc>
  22619. <![CDATA[This class encapsulates a MapReduce job and its dependency. It monitors
  22620. the states of the depending jobs and updates the state of this job.
  22621. A job starts in the WAITING state. If it does not have any depending jobs,
  22622. or all of the depending jobs are in SUCCESS state, then the job state
  22623. will become READY. If any depending jobs fail, the job will fail too.
  22624. When in READY state, the job can be submitted to Hadoop for execution, with
  22625. the state changing into RUNNING state. From RUNNING state, the job
  22626. can get into SUCCESS or FAILED state, depending
  22627. on the status of the job execution.]]>
  22628. </doc>
  22629. </class>
  22630. <!-- end class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob -->
  22631. <!-- start class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State -->
  22632. <class name="ControlledJob.State" extends="java.lang.Enum"
  22633. abstract="false"
  22634. static="true" final="true" visibility="public"
  22635. deprecated="not deprecated">
  22636. <method name="values" return="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State[]"
  22637. abstract="false" native="false" synchronized="false"
  22638. static="true" final="false" visibility="public"
  22639. deprecated="not deprecated">
  22640. </method>
  22641. <method name="valueOf" return="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State"
  22642. abstract="false" native="false" synchronized="false"
  22643. static="true" final="false" visibility="public"
  22644. deprecated="not deprecated">
  22645. <param name="name" type="java.lang.String"/>
  22646. </method>
  22647. </class>
  22648. <!-- end class org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob.State -->
  22649. <!-- start class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl -->
  22650. <class name="JobControl" extends="java.lang.Object"
  22651. abstract="false"
  22652. static="false" final="false" visibility="public"
  22653. deprecated="not deprecated">
  22654. <implements name="java.lang.Runnable"/>
  22655. <constructor name="JobControl" type="java.lang.String"
  22656. static="false" final="false" visibility="public"
  22657. deprecated="not deprecated">
  22658. <doc>
  22659. <![CDATA[Construct a job control for a group of jobs.
  22660. @param groupName a name identifying this group]]>
  22661. </doc>
  22662. </constructor>
  22663. <method name="getWaitingJobList" return="java.util.List"
  22664. abstract="false" native="false" synchronized="false"
  22665. static="false" final="false" visibility="public"
  22666. deprecated="not deprecated">
  22667. <doc>
  22668. <![CDATA[@return the jobs in the waiting state]]>
  22669. </doc>
  22670. </method>
  22671. <method name="getRunningJobList" return="java.util.List"
  22672. abstract="false" native="false" synchronized="false"
  22673. static="false" final="false" visibility="public"
  22674. deprecated="not deprecated">
  22675. <doc>
  22676. <![CDATA[@return the jobs in the running state]]>
  22677. </doc>
  22678. </method>
  22679. <method name="getReadyJobsList" return="java.util.List"
  22680. abstract="false" native="false" synchronized="false"
  22681. static="false" final="false" visibility="public"
  22682. deprecated="not deprecated">
  22683. <doc>
  22684. <![CDATA[@return the jobs in the ready state]]>
  22685. </doc>
  22686. </method>
  22687. <method name="getSuccessfulJobList" return="java.util.List"
  22688. abstract="false" native="false" synchronized="false"
  22689. static="false" final="false" visibility="public"
  22690. deprecated="not deprecated">
  22691. <doc>
  22692. <![CDATA[@return the jobs in the success state]]>
  22693. </doc>
  22694. </method>
  22695. <method name="getFailedJobList" return="java.util.List"
  22696. abstract="false" native="false" synchronized="false"
  22697. static="false" final="false" visibility="public"
  22698. deprecated="not deprecated">
  22699. </method>
  22700. <method name="addJob" return="java.lang.String"
  22701. abstract="false" native="false" synchronized="true"
  22702. static="false" final="false" visibility="public"
  22703. deprecated="not deprecated">
  22704. <param name="aJob" type="org.apache.hadoop.mapreduce.lib.jobcontrol.ControlledJob"/>
  22705. <doc>
  22706. <![CDATA[Add a new job.
  22707. @param aJob the new job]]>
  22708. </doc>
  22709. </method>
  22710. <method name="addJobCollection"
  22711. abstract="false" native="false" synchronized="false"
  22712. static="false" final="false" visibility="public"
  22713. deprecated="not deprecated">
  22714. <param name="jobs" type="java.util.Collection"/>
  22715. <doc>
  22716. <![CDATA[Add a collection of jobs
  22717. @param jobs the collection of jobs to add]]>
  22718. </doc>
  22719. </method>
  22720. <method name="getThreadState" return="org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState"
  22721. abstract="false" native="false" synchronized="false"
  22722. static="false" final="false" visibility="public"
  22723. deprecated="not deprecated">
  22724. <doc>
  22725. <![CDATA[@return the thread state]]>
  22726. </doc>
  22727. </method>
  22728. <method name="stop"
  22729. abstract="false" native="false" synchronized="false"
  22730. static="false" final="false" visibility="public"
  22731. deprecated="not deprecated">
  22732. <doc>
  22733. <![CDATA[set the thread state to STOPPING so that the
  22734. thread will stop when it wakes up.]]>
  22735. </doc>
  22736. </method>
  22737. <method name="suspend"
  22738. abstract="false" native="false" synchronized="false"
  22739. static="false" final="false" visibility="public"
  22740. deprecated="not deprecated">
  22741. <doc>
  22742. <![CDATA[suspend the running thread]]>
  22743. </doc>
  22744. </method>
  22745. <method name="resume"
  22746. abstract="false" native="false" synchronized="false"
  22747. static="false" final="false" visibility="public"
  22748. deprecated="not deprecated">
  22749. <doc>
  22750. <![CDATA[resume the suspended thread]]>
  22751. </doc>
  22752. </method>
  22753. <method name="allFinished" return="boolean"
  22754. abstract="false" native="false" synchronized="true"
  22755. static="false" final="false" visibility="public"
  22756. deprecated="not deprecated">
  22757. </method>
  22758. <method name="run"
  22759. abstract="false" native="false" synchronized="false"
  22760. static="false" final="false" visibility="public"
  22761. deprecated="not deprecated">
  22762. <doc>
  22763. <![CDATA[The main loop for the thread.
  22764. The loop does the following:
  22765. Check the states of the running jobs
  22766. Update the states of waiting jobs
  22767. Submit the jobs in ready state]]>
  22768. </doc>
  22769. </method>
  22770. <doc>
  22771. <![CDATA[This class encapsulates a set of MapReduce jobs and their dependencies.
  22772. It tracks the states of the jobs by placing them into different tables
  22773. according to their states.
  22774. This class provides APIs for the client app to add a job to the group
  22775. and to get the jobs in the group in different states. When a job is
  22776. added, an ID unique to the group is assigned to the job.
  22777. This class has a thread that submits jobs when they become ready,
  22778. monitors the states of the running jobs, and updates the states of jobs
  22779. based on the state changes of the jobs they depend on. The class
  22780. provides APIs for suspending/resuming the thread, and
  22781. for stopping the thread.]]>
  22782. </doc>
  22783. </class>
  22784. <!-- end class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl -->
  22785. <!-- start class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState -->
  22786. <class name="JobControl.ThreadState" extends="java.lang.Enum"
  22787. abstract="false"
  22788. static="true" final="true" visibility="public"
  22789. deprecated="not deprecated">
  22790. <method name="values" return="org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState[]"
  22791. abstract="false" native="false" synchronized="false"
  22792. static="true" final="false" visibility="public"
  22793. deprecated="not deprecated">
  22794. </method>
  22795. <method name="valueOf" return="org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState"
  22796. abstract="false" native="false" synchronized="false"
  22797. static="true" final="false" visibility="public"
  22798. deprecated="not deprecated">
  22799. <param name="name" type="java.lang.String"/>
  22800. </method>
  22801. </class>
  22802. <!-- end class org.apache.hadoop.mapreduce.lib.jobcontrol.JobControl.ThreadState -->
  22803. </package>
  22804. <package name="org.apache.hadoop.mapreduce.lib.join">
  22805. <!-- start class org.apache.hadoop.mapreduce.lib.join.ArrayListBackedIterator -->
  22806. <class name="ArrayListBackedIterator" extends="java.lang.Object"
  22807. abstract="false"
  22808. static="false" final="false" visibility="public"
  22809. deprecated="not deprecated">
  22810. <implements name="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  22811. <constructor name="ArrayListBackedIterator"
  22812. static="false" final="false" visibility="public"
  22813. deprecated="not deprecated">
  22814. </constructor>
  22815. <constructor name="ArrayListBackedIterator" type="java.util.ArrayList"
  22816. static="false" final="false" visibility="public"
  22817. deprecated="not deprecated">
  22818. </constructor>
  22819. <method name="hasNext" return="boolean"
  22820. abstract="false" native="false" synchronized="false"
  22821. static="false" final="false" visibility="public"
  22822. deprecated="not deprecated">
  22823. </method>
  22824. <method name="next" return="boolean"
  22825. abstract="false" native="false" synchronized="false"
  22826. static="false" final="false" visibility="public"
  22827. deprecated="not deprecated">
  22828. <param name="val" type="X"/>
  22829. <exception name="IOException" type="java.io.IOException"/>
  22830. </method>
  22831. <method name="replay" return="boolean"
  22832. abstract="false" native="false" synchronized="false"
  22833. static="false" final="false" visibility="public"
  22834. deprecated="not deprecated">
  22835. <param name="val" type="X"/>
  22836. <exception name="IOException" type="java.io.IOException"/>
  22837. </method>
  22838. <method name="reset"
  22839. abstract="false" native="false" synchronized="false"
  22840. static="false" final="false" visibility="public"
  22841. deprecated="not deprecated">
  22842. </method>
  22843. <method name="add"
  22844. abstract="false" native="false" synchronized="false"
  22845. static="false" final="false" visibility="public"
  22846. deprecated="not deprecated">
  22847. <param name="item" type="X"/>
  22848. <exception name="IOException" type="java.io.IOException"/>
  22849. </method>
  22850. <method name="close"
  22851. abstract="false" native="false" synchronized="false"
  22852. static="false" final="false" visibility="public"
  22853. deprecated="not deprecated">
  22854. <exception name="IOException" type="java.io.IOException"/>
  22855. </method>
  22856. <method name="clear"
  22857. abstract="false" native="false" synchronized="false"
  22858. static="false" final="false" visibility="public"
  22859. deprecated="not deprecated">
  22860. </method>
  22861. <doc>
  22862. <![CDATA[This class provides an implementation of ResetableIterator. The
  22863. implementation uses an {@link java.util.ArrayList} to store elements
  22864. added to it, replaying them as requested.
  22865. Prefer {@link StreamBackedIterator}.]]>
  22866. </doc>
  22867. </class>
  22868. <!-- end class org.apache.hadoop.mapreduce.lib.join.ArrayListBackedIterator -->
  22869. <!-- start class org.apache.hadoop.mapreduce.lib.join.ComposableInputFormat -->
  22870. <class name="ComposableInputFormat" extends="org.apache.hadoop.mapreduce.InputFormat"
  22871. abstract="true"
  22872. static="false" final="false" visibility="public"
  22873. deprecated="not deprecated">
  22874. <constructor name="ComposableInputFormat"
  22875. static="false" final="false" visibility="public"
  22876. deprecated="not deprecated">
  22877. </constructor>
  22878. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader"
  22879. abstract="true" native="false" synchronized="false"
  22880. static="false" final="false" visibility="public"
  22881. deprecated="not deprecated">
  22882. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22883. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22884. <exception name="IOException" type="java.io.IOException"/>
  22885. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22886. </method>
  22887. <doc>
  22888. <![CDATA[Refinement of InputFormat requiring implementors to provide
  22889. ComposableRecordReader instead of RecordReader.]]>
  22890. </doc>
  22891. </class>
  22892. <!-- end class org.apache.hadoop.mapreduce.lib.join.ComposableInputFormat -->
  22893. <!-- start class org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader -->
  22894. <class name="ComposableRecordReader" extends="org.apache.hadoop.mapreduce.RecordReader"
  22895. abstract="true"
  22896. static="false" final="false" visibility="public"
  22897. deprecated="not deprecated">
  22898. <implements name="java.lang.Comparable"/>
  22899. <constructor name="ComposableRecordReader"
  22900. static="false" final="false" visibility="public"
  22901. deprecated="not deprecated">
  22902. </constructor>
  22903. <doc>
  22904. <![CDATA[Additional operations required of a RecordReader to participate in a join.]]>
  22905. </doc>
  22906. </class>
  22907. <!-- end class org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader -->
  22908. <!-- start class org.apache.hadoop.mapreduce.lib.join.CompositeInputFormat -->
  22909. <class name="CompositeInputFormat" extends="org.apache.hadoop.mapreduce.InputFormat"
  22910. abstract="false"
  22911. static="false" final="false" visibility="public"
  22912. deprecated="not deprecated">
  22913. <constructor name="CompositeInputFormat"
  22914. static="false" final="false" visibility="public"
  22915. deprecated="not deprecated">
  22916. </constructor>
  22917. <method name="setFormat"
  22918. abstract="false" native="false" synchronized="false"
  22919. static="false" final="false" visibility="public"
  22920. deprecated="not deprecated">
  22921. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  22922. <exception name="IOException" type="java.io.IOException"/>
  22923. <doc>
  22924. <![CDATA[Interpret a given string as a composite expression.
  22925. {@code
  22926. func ::= <ident>([<func>,]*<func>)
  22927. func ::= tbl(<class>,"<path>")
  22928. class ::= @see java.lang.Class#forName(java.lang.String)
  22929. path ::= @see org.apache.hadoop.fs.Path#Path(java.lang.String)
  22930. }
  22931. Reads expression from the <tt>mapreduce.join.expr</tt> property and
  22932. user-supplied join types from <tt>mapreduce.join.define.&lt;ident&gt;</tt>
  22933. types. Paths supplied to <tt>tbl</tt> are given as input paths to the
  22934. InputFormat class listed.
  22935. @see #compose(java.lang.String, java.lang.Class, java.lang.String...)]]>
  22936. </doc>
  22937. </method>
  22938. <method name="addDefaults"
  22939. abstract="false" native="false" synchronized="false"
  22940. static="false" final="false" visibility="protected"
  22941. deprecated="not deprecated">
  22942. <doc>
  22943. <![CDATA[Adds the default set of identifiers to the parser.]]>
  22944. </doc>
  22945. </method>
  22946. <method name="getSplits" return="java.util.List"
  22947. abstract="false" native="false" synchronized="false"
  22948. static="false" final="false" visibility="public"
  22949. deprecated="not deprecated">
  22950. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  22951. <exception name="IOException" type="java.io.IOException"/>
  22952. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22953. <doc>
  22954. <![CDATA[Build a CompositeInputSplit from the child InputFormats by assigning the
  22955. ith split from each child to the ith composite split.]]>
  22956. </doc>
  22957. </method>
  22958. <method name="createRecordReader" return="org.apache.hadoop.mapreduce.RecordReader"
  22959. abstract="false" native="false" synchronized="false"
  22960. static="false" final="false" visibility="public"
  22961. deprecated="not deprecated">
  22962. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  22963. <param name="taskContext" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  22964. <exception name="IOException" type="java.io.IOException"/>
  22965. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  22966. <doc>
  22967. <![CDATA[Construct a CompositeRecordReader for the children of this InputFormat
  22968. as defined in the init expression.
  22969. The outermost join need only be composable, not necessarily a composite.
  22970. Mandating TupleWritable isn't strictly correct.]]>
  22971. </doc>
  22972. </method>
  22973. <method name="compose" return="java.lang.String"
  22974. abstract="false" native="false" synchronized="false"
  22975. static="true" final="false" visibility="public"
  22976. deprecated="not deprecated">
  22977. <param name="inf" type="java.lang.Class"/>
  22978. <param name="path" type="java.lang.String"/>
  22979. <doc>
  22980. <![CDATA[Convenience method for constructing composite formats.
  22981. Given InputFormat class (inf), path (p) return:
  22982. {@code tbl(<inf>, <p>) }]]>
  22983. </doc>
  22984. </method>
  22985. <method name="compose" return="java.lang.String"
  22986. abstract="false" native="false" synchronized="false"
  22987. static="true" final="false" visibility="public"
  22988. deprecated="not deprecated">
  22989. <param name="op" type="java.lang.String"/>
  22990. <param name="inf" type="java.lang.Class"/>
  22991. <param name="path" type="java.lang.String[]"/>
  22992. <doc>
  22993. <![CDATA[Convenience method for constructing composite formats.
  22994. Given operation (op), Object class (inf), set of paths (p) return:
  22995. {@code <op>(tbl(<inf>,<p1>),tbl(<inf>,<p2>),...,tbl(<inf>,<pn>)) }]]>
  22996. </doc>
  22997. </method>
  22998. <method name="compose" return="java.lang.String"
  22999. abstract="false" native="false" synchronized="false"
  23000. static="true" final="false" visibility="public"
  23001. deprecated="not deprecated">
  23002. <param name="op" type="java.lang.String"/>
  23003. <param name="inf" type="java.lang.Class"/>
  23004. <param name="path" type="org.apache.hadoop.fs.Path[]"/>
  23005. <doc>
  23006. <![CDATA[Convenience method for constructing composite formats.
  23007. Given operation (op), Object class (inf), set of paths (p) return:
  23008. {@code <op>(tbl(<inf>,<p1>),tbl(<inf>,<p2>),...,tbl(<inf>,<pn>)) }]]>
  23009. </doc>
  23010. </method>
  23011. <field name="JOIN_EXPR" type="java.lang.String"
  23012. transient="false" volatile="false"
  23013. static="true" final="true" visibility="public"
  23014. deprecated="not deprecated">
  23015. </field>
  23016. <field name="JOIN_COMPARATOR" type="java.lang.String"
  23017. transient="false" volatile="false"
  23018. static="true" final="true" visibility="public"
  23019. deprecated="not deprecated">
  23020. </field>
  23021. <doc>
  23022. <![CDATA[An InputFormat capable of performing joins over a set of data sources sorted
  23023. and partitioned the same way.
  23024. @see #setFormat
  23025. A user may define new join types by setting the property
  23026. <tt>mapreduce.join.define.&lt;ident&gt;</tt> to a classname.
  23027. In the expression <tt>mapreduce.join.expr</tt>, the identifier will be
  23028. assumed to be a ComposableRecordReader.
  23029. <tt>mapreduce.join.keycomparator</tt> can be a classname used to compare
  23030. keys in the join.
  23031. @see JoinRecordReader
  23032. @see MultiFilterRecordReader]]>
  23033. </doc>
  23034. </class>
  23035. <!-- end class org.apache.hadoop.mapreduce.lib.join.CompositeInputFormat -->
  23036. <!-- start class org.apache.hadoop.mapreduce.lib.join.CompositeInputSplit -->
  23037. <class name="CompositeInputSplit" extends="org.apache.hadoop.mapreduce.InputSplit"
  23038. abstract="false"
  23039. static="false" final="false" visibility="public"
  23040. deprecated="not deprecated">
  23041. <implements name="org.apache.hadoop.io.Writable"/>
  23042. <constructor name="CompositeInputSplit"
  23043. static="false" final="false" visibility="public"
  23044. deprecated="not deprecated">
  23045. </constructor>
  23046. <constructor name="CompositeInputSplit" type="int"
  23047. static="false" final="false" visibility="public"
  23048. deprecated="not deprecated">
  23049. </constructor>
  23050. <method name="add"
  23051. abstract="false" native="false" synchronized="false"
  23052. static="false" final="false" visibility="public"
  23053. deprecated="not deprecated">
  23054. <param name="s" type="org.apache.hadoop.mapreduce.InputSplit"/>
  23055. <exception name="IOException" type="java.io.IOException"/>
  23056. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23057. <doc>
  23058. <![CDATA[Add an InputSplit to this collection.
  23059. @throws IOException If capacity was not specified during construction
  23060. or if capacity has been reached.]]>
  23061. </doc>
  23062. </method>
  23063. <method name="get" return="org.apache.hadoop.mapreduce.InputSplit"
  23064. abstract="false" native="false" synchronized="false"
  23065. static="false" final="false" visibility="public"
  23066. deprecated="not deprecated">
  23067. <param name="i" type="int"/>
  23068. <doc>
  23069. <![CDATA[Get ith child InputSplit.]]>
  23070. </doc>
  23071. </method>
  23072. <method name="getLength" return="long"
  23073. abstract="false" native="false" synchronized="false"
  23074. static="false" final="false" visibility="public"
  23075. deprecated="not deprecated">
  23076. <exception name="IOException" type="java.io.IOException"/>
  23077. <doc>
  23078. <![CDATA[Return the aggregate length of all child InputSplits currently added.]]>
  23079. </doc>
  23080. </method>
  23081. <method name="getLength" return="long"
  23082. abstract="false" native="false" synchronized="false"
  23083. static="false" final="false" visibility="public"
  23084. deprecated="not deprecated">
  23085. <param name="i" type="int"/>
  23086. <exception name="IOException" type="java.io.IOException"/>
  23087. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23088. <doc>
  23089. <![CDATA[Get the length of ith child InputSplit.]]>
  23090. </doc>
  23091. </method>
  23092. <method name="getLocations" return="java.lang.String[]"
  23093. abstract="false" native="false" synchronized="false"
  23094. static="false" final="false" visibility="public"
  23095. deprecated="not deprecated">
  23096. <exception name="IOException" type="java.io.IOException"/>
  23097. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23098. <doc>
  23099. <![CDATA[Collect a set of hosts from all child InputSplits.]]>
  23100. </doc>
  23101. </method>
  23102. <method name="getLocation" return="java.lang.String[]"
  23103. abstract="false" native="false" synchronized="false"
  23104. static="false" final="false" visibility="public"
  23105. deprecated="not deprecated">
  23106. <param name="i" type="int"/>
  23107. <exception name="IOException" type="java.io.IOException"/>
  23108. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23109. <doc>
  23110. <![CDATA[getLocations from ith InputSplit.]]>
  23111. </doc>
  23112. </method>
  23113. <method name="write"
  23114. abstract="false" native="false" synchronized="false"
  23115. static="false" final="false" visibility="public"
  23116. deprecated="not deprecated">
  23117. <param name="out" type="java.io.DataOutput"/>
  23118. <exception name="IOException" type="java.io.IOException"/>
  23119. <doc>
  23120. <![CDATA[Write splits in the following format.
  23121. {@code
  23122. <count><class1><class2>...<classn><split1><split2>...<splitn>
  23123. }]]>
  23124. </doc>
  23125. </method>
  23126. <method name="readFields"
  23127. abstract="false" native="false" synchronized="false"
  23128. static="false" final="false" visibility="public"
  23129. deprecated="not deprecated">
  23130. <param name="in" type="java.io.DataInput"/>
  23131. <exception name="IOException" type="java.io.IOException"/>
  23132. <doc>
  23133. <![CDATA[{@inheritDoc}
  23134. @throws IOException If the child InputSplit cannot be read, typically
  23135. for failing access checks.]]>
  23136. </doc>
  23137. </method>
  23138. <doc>
  23139. <![CDATA[This InputSplit contains a set of child InputSplits. Any InputSplit inserted
  23140. into this collection must have a public default constructor.]]>
  23141. </doc>
  23142. </class>
  23143. <!-- end class org.apache.hadoop.mapreduce.lib.join.CompositeInputSplit -->
  23144. <!-- start class org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader -->
  23145. <class name="CompositeRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader"
  23146. abstract="true"
  23147. static="false" final="false" visibility="public"
  23148. deprecated="not deprecated">
  23149. <implements name="org.apache.hadoop.conf.Configurable"/>
  23150. <constructor name="CompositeRecordReader" type="int, int, java.lang.Class"
  23151. static="false" final="false" visibility="public"
  23152. deprecated="not deprecated">
  23153. <exception name="IOException" type="java.io.IOException"/>
  23154. <doc>
  23155. <![CDATA[Create a RecordReader with <tt>capacity</tt> children to position
  23156. <tt>id</tt> in the parent reader.
  23157. The id of a root CompositeRecordReader is -1 by convention, but relying
  23158. on this is not recommended.]]>
  23159. </doc>
  23160. </constructor>
  23161. <method name="combine" return="boolean"
  23162. abstract="true" native="false" synchronized="false"
  23163. static="false" final="false" visibility="protected"
  23164. deprecated="not deprecated">
  23165. <param name="srcs" type="java.lang.Object[]"/>
  23166. <param name="value" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23167. </method>
  23168. <method name="initialize"
  23169. abstract="false" native="false" synchronized="false"
  23170. static="false" final="false" visibility="public"
  23171. deprecated="not deprecated">
  23172. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  23173. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  23174. <exception name="IOException" type="java.io.IOException"/>
  23175. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23176. </method>
  23177. <method name="id" return="int"
  23178. abstract="false" native="false" synchronized="false"
  23179. static="false" final="false" visibility="public"
  23180. deprecated="not deprecated">
  23181. <doc>
  23182. <![CDATA[Return the position in the collector this class occupies.]]>
  23183. </doc>
  23184. </method>
  23185. <method name="setConf"
  23186. abstract="false" native="false" synchronized="false"
  23187. static="false" final="false" visibility="public"
  23188. deprecated="not deprecated">
  23189. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  23190. <doc>
  23191. <![CDATA[{@inheritDoc}]]>
  23192. </doc>
  23193. </method>
  23194. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  23195. abstract="false" native="false" synchronized="false"
  23196. static="false" final="false" visibility="public"
  23197. deprecated="not deprecated">
  23198. <doc>
  23199. <![CDATA[{@inheritDoc}]]>
  23200. </doc>
  23201. </method>
  23202. <method name="getRecordReaderQueue" return="java.util.PriorityQueue"
  23203. abstract="false" native="false" synchronized="false"
  23204. static="false" final="false" visibility="protected"
  23205. deprecated="not deprecated">
  23206. <doc>
  23207. <![CDATA[Return sorted list of RecordReaders for this composite.]]>
  23208. </doc>
  23209. </method>
  23210. <method name="getComparator" return="org.apache.hadoop.io.WritableComparator"
  23211. abstract="false" native="false" synchronized="false"
  23212. static="false" final="false" visibility="protected"
  23213. deprecated="not deprecated">
  23214. <doc>
  23215. <![CDATA[Return comparator defining the ordering for RecordReaders in this
  23216. composite.]]>
  23217. </doc>
  23218. </method>
  23219. <method name="add"
  23220. abstract="false" native="false" synchronized="false"
  23221. static="false" final="false" visibility="public"
  23222. deprecated="not deprecated">
  23223. <param name="rr" type="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader"/>
  23224. <exception name="IOException" type="java.io.IOException"/>
  23225. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23226. <doc>
  23227. <![CDATA[Add a RecordReader to this collection.
  23228. The id() of a RecordReader determines where in the Tuple its
  23229. entry will appear. Adding RecordReaders with the same id has
  23230. undefined behavior.]]>
  23231. </doc>
  23232. </method>
  23233. <method name="key" return="K"
  23234. abstract="false" native="false" synchronized="false"
  23235. static="false" final="false" visibility="public"
  23236. deprecated="not deprecated">
  23237. <doc>
  23238. <![CDATA[Return the key for the current join or the value at the top of the
  23239. RecordReader heap.]]>
  23240. </doc>
  23241. </method>
  23242. <method name="key"
  23243. abstract="false" native="false" synchronized="false"
  23244. static="false" final="false" visibility="public"
  23245. deprecated="not deprecated">
  23246. <param name="key" type="K"/>
  23247. <exception name="IOException" type="java.io.IOException"/>
  23248. <doc>
  23249. <![CDATA[Clone the key at the top of this RR into the given object.]]>
  23250. </doc>
  23251. </method>
  23252. <method name="getCurrentKey" return="K"
  23253. abstract="false" native="false" synchronized="false"
  23254. static="false" final="false" visibility="public"
  23255. deprecated="not deprecated">
  23256. </method>
  23257. <method name="hasNext" return="boolean"
  23258. abstract="false" native="false" synchronized="false"
  23259. static="false" final="false" visibility="public"
  23260. deprecated="not deprecated">
  23261. <doc>
  23262. <![CDATA[Return true if it is possible that this could emit more values.]]>
  23263. </doc>
  23264. </method>
  23265. <method name="skip"
  23266. abstract="false" native="false" synchronized="false"
  23267. static="false" final="false" visibility="public"
  23268. deprecated="not deprecated">
  23269. <param name="key" type="K"/>
  23270. <exception name="IOException" type="java.io.IOException"/>
  23271. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23272. <doc>
  23273. <![CDATA[Pass skip key to child RRs.]]>
  23274. </doc>
  23275. </method>
  23276. <method name="getDelegate" return="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"
  23277. abstract="true" native="false" synchronized="false"
  23278. static="false" final="false" visibility="protected"
  23279. deprecated="not deprecated">
  23280. <doc>
  23281. <![CDATA[Obtain an iterator over the child RRs apropos of the value type
  23282. ultimately emitted from this join.]]>
  23283. </doc>
  23284. </method>
  23285. <method name="accept"
  23286. abstract="false" native="false" synchronized="false"
  23287. static="false" final="false" visibility="public"
  23288. deprecated="not deprecated">
  23289. <param name="jc" type="org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader.JoinCollector"/>
  23290. <param name="key" type="K"/>
  23291. <exception name="IOException" type="java.io.IOException"/>
  23292. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23293. <doc>
  23294. <![CDATA[If key provided matches that of this Composite, give JoinCollector
  23295. iterator over values it may emit.]]>
  23296. </doc>
  23297. </method>
  23298. <method name="fillJoinCollector"
  23299. abstract="false" native="false" synchronized="false"
  23300. static="false" final="false" visibility="protected"
  23301. deprecated="not deprecated">
  23302. <param name="iterkey" type="K"/>
  23303. <exception name="IOException" type="java.io.IOException"/>
  23304. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23305. <doc>
  23306. <![CDATA[For all child RRs offering the key provided, obtain an iterator
  23307. at that position in the JoinCollector.]]>
  23308. </doc>
  23309. </method>
  23310. <method name="compareTo" return="int"
  23311. abstract="false" native="false" synchronized="false"
  23312. static="false" final="false" visibility="public"
  23313. deprecated="not deprecated">
  23314. <param name="other" type="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader"/>
  23315. <doc>
  23316. <![CDATA[Implement Comparable contract (compare key of join or head of heap
  23317. with that of another).]]>
  23318. </doc>
  23319. </method>
  23320. <method name="createKey" return="K"
  23321. abstract="false" native="false" synchronized="false"
  23322. static="false" final="false" visibility="protected"
  23323. deprecated="not deprecated">
  23324. <doc>
  23325. <![CDATA[Create a new key common to all child RRs.
  23326. @throws ClassCastException if key classes differ.]]>
  23327. </doc>
  23328. </method>
  23329. <method name="createTupleWritable" return="org.apache.hadoop.mapreduce.lib.join.TupleWritable"
  23330. abstract="false" native="false" synchronized="false"
  23331. static="false" final="false" visibility="protected"
  23332. deprecated="not deprecated">
  23333. <doc>
  23334. <![CDATA[Create a value to be used internally for joins.]]>
  23335. </doc>
  23336. </method>
  23337. <method name="getCurrentValue" return="X"
  23338. abstract="false" native="false" synchronized="false"
  23339. static="false" final="false" visibility="public"
  23340. deprecated="not deprecated">
  23341. <exception name="IOException" type="java.io.IOException"/>
  23342. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23343. <doc>
  23344. <![CDATA[{@inheritDoc}]]>
  23345. </doc>
  23346. </method>
  23347. <method name="close"
  23348. abstract="false" native="false" synchronized="false"
  23349. static="false" final="false" visibility="public"
  23350. deprecated="not deprecated">
  23351. <exception name="IOException" type="java.io.IOException"/>
  23352. <doc>
  23353. <![CDATA[Close all child RRs.]]>
  23354. </doc>
  23355. </method>
  23356. <method name="getProgress" return="float"
  23357. abstract="false" native="false" synchronized="false"
  23358. static="false" final="false" visibility="public"
  23359. deprecated="not deprecated">
  23360. <exception name="IOException" type="java.io.IOException"/>
  23361. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23362. <doc>
  23363. <![CDATA[Report progress as the minimum of all child RR progress.]]>
  23364. </doc>
  23365. </method>
  23366. <field name="conf" type="org.apache.hadoop.conf.Configuration"
  23367. transient="false" volatile="false"
  23368. static="false" final="false" visibility="protected"
  23369. deprecated="not deprecated">
  23370. </field>
  23371. <field name="keyclass" type="java.lang.Class"
  23372. transient="false" volatile="false"
  23373. static="false" final="false" visibility="protected"
  23374. deprecated="not deprecated">
  23375. </field>
  23376. <field name="jc" type="org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader.JoinCollector"
  23377. transient="false" volatile="false"
  23378. static="false" final="true" visibility="protected"
  23379. deprecated="not deprecated">
  23380. </field>
  23381. <field name="kids" type="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader[]"
  23382. transient="false" volatile="false"
  23383. static="false" final="true" visibility="protected"
  23384. deprecated="not deprecated">
  23385. </field>
  23386. <field name="key" type="K"
  23387. transient="false" volatile="false"
  23388. static="false" final="false" visibility="protected"
  23389. deprecated="not deprecated">
  23390. </field>
  23391. <field name="value" type="X"
  23392. transient="false" volatile="false"
  23393. static="false" final="false" visibility="protected"
  23394. deprecated="not deprecated">
  23395. </field>
  23396. <doc>
  23397. <![CDATA[A RecordReader that can effect joins of RecordReaders sharing a common key
  23398. type and partitioning.]]>
  23399. </doc>
  23400. </class>
  23401. <!-- end class org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader -->
  23402. <!-- start class org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader.JoinCollector -->
  23403. <class name="CompositeRecordReader.JoinCollector" extends="java.lang.Object"
  23404. abstract="false"
  23405. static="false" final="false" visibility="public"
  23406. deprecated="not deprecated">
  23407. <constructor name="CompositeRecordReader.JoinCollector" type="int"
  23408. static="false" final="false" visibility="public"
  23409. deprecated="not deprecated">
  23410. <doc>
  23411. <![CDATA[Construct a collector capable of handling the specified number of
  23412. children.]]>
  23413. </doc>
  23414. </constructor>
  23415. <method name="add"
  23416. abstract="false" native="false" synchronized="false"
  23417. static="false" final="false" visibility="public"
  23418. deprecated="not deprecated">
  23419. <param name="id" type="int"/>
  23420. <param name="i" type="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  23421. <exception name="IOException" type="java.io.IOException"/>
  23422. <doc>
  23423. <![CDATA[Register a given iterator at position id.]]>
  23424. </doc>
  23425. </method>
  23426. <method name="key" return="K"
  23427. abstract="false" native="false" synchronized="false"
  23428. static="false" final="false" visibility="public"
  23429. deprecated="not deprecated">
  23430. <doc>
  23431. <![CDATA[Return the key associated with this collection.]]>
  23432. </doc>
  23433. </method>
  23434. <method name="reset"
  23435. abstract="false" native="false" synchronized="false"
  23436. static="false" final="false" visibility="public"
  23437. deprecated="not deprecated">
  23438. <param name="key" type="K"/>
  23439. <doc>
  23440. <![CDATA[Codify the contents of the collector to be iterated over.
  23441. When this is called, all RecordReaders registered for this
  23442. key should have added ResetableIterators.]]>
  23443. </doc>
  23444. </method>
  23445. <method name="clear"
  23446. abstract="false" native="false" synchronized="false"
  23447. static="false" final="false" visibility="public"
  23448. deprecated="not deprecated">
  23449. <doc>
  23450. <![CDATA[Clear all state information.]]>
  23451. </doc>
  23452. </method>
  23453. <method name="hasNext" return="boolean"
  23454. abstract="false" native="false" synchronized="false"
  23455. static="false" final="false" visibility="public"
  23456. deprecated="not deprecated">
  23457. <doc>
  23458. <![CDATA[Returns false if exhausted or if reset(K) has not been called.]]>
  23459. </doc>
  23460. </method>
  23461. <method name="next" return="boolean"
  23462. abstract="false" native="false" synchronized="false"
  23463. static="false" final="false" visibility="protected"
  23464. deprecated="not deprecated">
  23465. <param name="val" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23466. <exception name="IOException" type="java.io.IOException"/>
  23467. <doc>
  23468. <![CDATA[Populate Tuple from iterators.
  23469. It should be the case that, given iterators i_1...i_n over values from
  23470. sources s_1...s_n sharing key k, repeated calls to next should yield
  23471. the cross product i_1 x ... x i_n.]]>
  23472. </doc>
  23473. </method>
  23474. <method name="replay" return="boolean"
  23475. abstract="false" native="false" synchronized="false"
  23476. static="false" final="false" visibility="public"
  23477. deprecated="not deprecated">
  23478. <param name="val" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23479. <exception name="IOException" type="java.io.IOException"/>
  23480. <doc>
  23481. <![CDATA[Replay the last Tuple emitted.]]>
  23482. </doc>
  23483. </method>
  23484. <method name="close"
  23485. abstract="false" native="false" synchronized="false"
  23486. static="false" final="false" visibility="public"
  23487. deprecated="not deprecated">
  23488. <exception name="IOException" type="java.io.IOException"/>
  23489. <doc>
  23490. <![CDATA[Close all child iterators.]]>
  23491. </doc>
  23492. </method>
  23493. <method name="flush" return="boolean"
  23494. abstract="false" native="false" synchronized="false"
  23495. static="false" final="false" visibility="public"
  23496. deprecated="not deprecated">
  23497. <param name="value" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23498. <exception name="IOException" type="java.io.IOException"/>
  23499. <doc>
  23500. <![CDATA[Write the next value into key, value as accepted by the operation
  23501. associated with this set of RecordReaders.]]>
  23502. </doc>
  23503. </method>
  23504. <doc>
  23505. <![CDATA[Collector for join values.
  23506. This accumulates values for a given key from the child RecordReaders. If
  23507. one or more child RR contain duplicate keys, this will emit the cross
  23508. product of the associated values until exhausted.]]>
  23509. </doc>
  23510. </class>
  23511. <!-- end class org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader.JoinCollector -->
  23512. <!-- start class org.apache.hadoop.mapreduce.lib.join.InnerJoinRecordReader -->
  23513. <class name="InnerJoinRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.JoinRecordReader"
  23514. abstract="false"
  23515. static="false" final="false" visibility="public"
  23516. deprecated="not deprecated">
  23517. <method name="combine" return="boolean"
  23518. abstract="false" native="false" synchronized="false"
  23519. static="false" final="false" visibility="protected"
  23520. deprecated="not deprecated">
  23521. <param name="srcs" type="java.lang.Object[]"/>
  23522. <param name="dst" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23523. <doc>
  23524. <![CDATA[Return true iff the tuple is full (all data sources contain this key).]]>
  23525. </doc>
  23526. </method>
  23527. <doc>
  23528. <![CDATA[Full inner join.]]>
  23529. </doc>
  23530. </class>
  23531. <!-- end class org.apache.hadoop.mapreduce.lib.join.InnerJoinRecordReader -->
  23532. <!-- start class org.apache.hadoop.mapreduce.lib.join.JoinRecordReader -->
  23533. <class name="JoinRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader"
  23534. abstract="true"
  23535. static="false" final="false" visibility="public"
  23536. deprecated="not deprecated">
  23537. <constructor name="JoinRecordReader" type="int, org.apache.hadoop.conf.Configuration, int, java.lang.Class"
  23538. static="false" final="false" visibility="public"
  23539. deprecated="not deprecated">
  23540. <exception name="IOException" type="java.io.IOException"/>
  23541. </constructor>
  23542. <method name="nextKeyValue" return="boolean"
  23543. abstract="false" native="false" synchronized="false"
  23544. static="false" final="false" visibility="public"
  23545. deprecated="not deprecated">
  23546. <exception name="IOException" type="java.io.IOException"/>
  23547. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23548. <doc>
  23549. <![CDATA[Emit the next set of key, value pairs as defined by the child
  23550. RecordReaders and operation associated with this composite RR.]]>
  23551. </doc>
  23552. </method>
  23553. <method name="createValue" return="org.apache.hadoop.mapreduce.lib.join.TupleWritable"
  23554. abstract="false" native="false" synchronized="false"
  23555. static="false" final="false" visibility="public"
  23556. deprecated="not deprecated">
  23557. </method>
  23558. <method name="getDelegate" return="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"
  23559. abstract="false" native="false" synchronized="false"
  23560. static="false" final="false" visibility="protected"
  23561. deprecated="not deprecated">
  23562. <doc>
  23563. <![CDATA[Return an iterator wrapping the JoinCollector.]]>
  23564. </doc>
  23565. </method>
  23566. <doc>
  23567. <![CDATA[Base class for Composite joins returning Tuples of arbitrary Writables.]]>
  23568. </doc>
  23569. </class>
  23570. <!-- end class org.apache.hadoop.mapreduce.lib.join.JoinRecordReader -->
  23571. <!-- start class org.apache.hadoop.mapreduce.lib.join.JoinRecordReader.JoinDelegationIterator -->
  23572. <class name="JoinRecordReader.JoinDelegationIterator" extends="java.lang.Object"
  23573. abstract="false"
  23574. static="false" final="false" visibility="protected"
  23575. deprecated="not deprecated">
  23576. <implements name="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  23577. <constructor name="JoinRecordReader.JoinDelegationIterator"
  23578. static="false" final="false" visibility="protected"
  23579. deprecated="not deprecated">
  23580. </constructor>
  23581. <method name="hasNext" return="boolean"
  23582. abstract="false" native="false" synchronized="false"
  23583. static="false" final="false" visibility="public"
  23584. deprecated="not deprecated">
  23585. </method>
  23586. <method name="next" return="boolean"
  23587. abstract="false" native="false" synchronized="false"
  23588. static="false" final="false" visibility="public"
  23589. deprecated="not deprecated">
  23590. <param name="val" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23591. <exception name="IOException" type="java.io.IOException"/>
  23592. </method>
  23593. <method name="replay" return="boolean"
  23594. abstract="false" native="false" synchronized="false"
  23595. static="false" final="false" visibility="public"
  23596. deprecated="not deprecated">
  23597. <param name="val" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23598. <exception name="IOException" type="java.io.IOException"/>
  23599. </method>
  23600. <method name="reset"
  23601. abstract="false" native="false" synchronized="false"
  23602. static="false" final="false" visibility="public"
  23603. deprecated="not deprecated">
  23604. </method>
  23605. <method name="add"
  23606. abstract="false" native="false" synchronized="false"
  23607. static="false" final="false" visibility="public"
  23608. deprecated="not deprecated">
  23609. <param name="item" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23610. <exception name="IOException" type="java.io.IOException"/>
  23611. </method>
  23612. <method name="close"
  23613. abstract="false" native="false" synchronized="false"
  23614. static="false" final="false" visibility="public"
  23615. deprecated="not deprecated">
  23616. <exception name="IOException" type="java.io.IOException"/>
  23617. </method>
  23618. <method name="clear"
  23619. abstract="false" native="false" synchronized="false"
  23620. static="false" final="false" visibility="public"
  23621. deprecated="not deprecated">
  23622. </method>
  23623. <doc>
  23624. <![CDATA[Since the JoinCollector is effecting our operation, we need only
  23625. provide an iterator proxy wrapping its operation.]]>
  23626. </doc>
  23627. </class>
  23628. <!-- end class org.apache.hadoop.mapreduce.lib.join.JoinRecordReader.JoinDelegationIterator -->
  23629. <!-- start class org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader -->
  23630. <class name="MultiFilterRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader"
  23631. abstract="true"
  23632. static="false" final="false" visibility="public"
  23633. deprecated="not deprecated">
  23634. <constructor name="MultiFilterRecordReader" type="int, org.apache.hadoop.conf.Configuration, int, java.lang.Class"
  23635. static="false" final="false" visibility="public"
  23636. deprecated="not deprecated">
  23637. <exception name="IOException" type="java.io.IOException"/>
  23638. </constructor>
  23639. <method name="emit" return="V"
  23640. abstract="true" native="false" synchronized="false"
  23641. static="false" final="false" visibility="protected"
  23642. deprecated="not deprecated">
  23643. <param name="dst" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23644. <exception name="IOException" type="java.io.IOException"/>
  23645. <doc>
  23646. <![CDATA[For each tuple emitted, return a value (typically one of the values
  23647. in the tuple).
  23648. Modifying the Writables in the tuple is permitted and unlikely to affect
  23649. join behavior in most cases, but it is not recommended. It's safer to
  23650. clone first.]]>
  23651. </doc>
  23652. </method>
  23653. <method name="combine" return="boolean"
  23654. abstract="false" native="false" synchronized="false"
  23655. static="false" final="false" visibility="protected"
  23656. deprecated="not deprecated">
  23657. <param name="srcs" type="java.lang.Object[]"/>
  23658. <param name="dst" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23659. <doc>
  23660. <![CDATA[Default implementation offers {@link #emit} every Tuple from the
  23661. collector (the outer join of child RRs).]]>
  23662. </doc>
  23663. </method>
  23664. <method name="nextKeyValue" return="boolean"
  23665. abstract="false" native="false" synchronized="false"
  23666. static="false" final="false" visibility="public"
  23667. deprecated="not deprecated">
  23668. <exception name="IOException" type="java.io.IOException"/>
  23669. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23670. <doc>
  23671. <![CDATA[{@inheritDoc}]]>
  23672. </doc>
  23673. </method>
  23674. <method name="initialize"
  23675. abstract="false" native="false" synchronized="false"
  23676. static="false" final="false" visibility="public"
  23677. deprecated="not deprecated">
  23678. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  23679. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  23680. <exception name="IOException" type="java.io.IOException"/>
  23681. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23682. </method>
  23683. <method name="getDelegate" return="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"
  23684. abstract="false" native="false" synchronized="false"
  23685. static="false" final="false" visibility="protected"
  23686. deprecated="not deprecated">
  23687. <doc>
  23688. <![CDATA[Return an iterator returning a single value from the tuple.
  23689. @see MultiFilterDelegationIterator]]>
  23690. </doc>
  23691. </method>
  23692. <doc>
  23693. <![CDATA[Base class for Composite join returning values derived from multiple
  23694. sources, but generally not tuples.]]>
  23695. </doc>
  23696. </class>
  23697. <!-- end class org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader -->
  23698. <!-- start class org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader.MultiFilterDelegationIterator -->
  23699. <class name="MultiFilterRecordReader.MultiFilterDelegationIterator" extends="java.lang.Object"
  23700. abstract="false"
  23701. static="false" final="false" visibility="protected"
  23702. deprecated="not deprecated">
  23703. <implements name="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  23704. <constructor name="MultiFilterRecordReader.MultiFilterDelegationIterator"
  23705. static="false" final="false" visibility="protected"
  23706. deprecated="not deprecated">
  23707. </constructor>
  23708. <method name="hasNext" return="boolean"
  23709. abstract="false" native="false" synchronized="false"
  23710. static="false" final="false" visibility="public"
  23711. deprecated="not deprecated">
  23712. </method>
  23713. <method name="next" return="boolean"
  23714. abstract="false" native="false" synchronized="false"
  23715. static="false" final="false" visibility="public"
  23716. deprecated="not deprecated">
  23717. <param name="val" type="V"/>
  23718. <exception name="IOException" type="java.io.IOException"/>
  23719. </method>
  23720. <method name="replay" return="boolean"
  23721. abstract="false" native="false" synchronized="false"
  23722. static="false" final="false" visibility="public"
  23723. deprecated="not deprecated">
  23724. <param name="val" type="V"/>
  23725. <exception name="IOException" type="java.io.IOException"/>
  23726. </method>
  23727. <method name="reset"
  23728. abstract="false" native="false" synchronized="false"
  23729. static="false" final="false" visibility="public"
  23730. deprecated="not deprecated">
  23731. </method>
  23732. <method name="add"
  23733. abstract="false" native="false" synchronized="false"
  23734. static="false" final="false" visibility="public"
  23735. deprecated="not deprecated">
  23736. <param name="item" type="V"/>
  23737. <exception name="IOException" type="java.io.IOException"/>
  23738. </method>
  23739. <method name="close"
  23740. abstract="false" native="false" synchronized="false"
  23741. static="false" final="false" visibility="public"
  23742. deprecated="not deprecated">
  23743. <exception name="IOException" type="java.io.IOException"/>
  23744. </method>
  23745. <method name="clear"
  23746. abstract="false" native="false" synchronized="false"
  23747. static="false" final="false" visibility="public"
  23748. deprecated="not deprecated">
  23749. </method>
  23750. <doc>
  23751. <![CDATA[Proxy the JoinCollector, but include callback to emit.]]>
  23752. </doc>
  23753. </class>
  23754. <!-- end class org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader.MultiFilterDelegationIterator -->
  23755. <!-- start class org.apache.hadoop.mapreduce.lib.join.OuterJoinRecordReader -->
  23756. <class name="OuterJoinRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.JoinRecordReader"
  23757. abstract="false"
  23758. static="false" final="false" visibility="public"
  23759. deprecated="not deprecated">
  23760. <method name="combine" return="boolean"
  23761. abstract="false" native="false" synchronized="false"
  23762. static="false" final="false" visibility="protected"
  23763. deprecated="not deprecated">
  23764. <param name="srcs" type="java.lang.Object[]"/>
  23765. <param name="dst" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23766. <doc>
  23767. <![CDATA[Emit everything from the collector.]]>
  23768. </doc>
  23769. </method>
  23770. <doc>
  23771. <![CDATA[Full outer join.]]>
  23772. </doc>
  23773. </class>
  23774. <!-- end class org.apache.hadoop.mapreduce.lib.join.OuterJoinRecordReader -->
  23775. <!-- start class org.apache.hadoop.mapreduce.lib.join.OverrideRecordReader -->
  23776. <class name="OverrideRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.MultiFilterRecordReader"
  23777. abstract="false"
  23778. static="false" final="false" visibility="public"
  23779. deprecated="not deprecated">
  23780. <method name="emit" return="V"
  23781. abstract="false" native="false" synchronized="false"
  23782. static="false" final="false" visibility="protected"
  23783. deprecated="not deprecated">
  23784. <param name="dst" type="org.apache.hadoop.mapreduce.lib.join.TupleWritable"/>
  23785. <doc>
  23786. <![CDATA[Emit the value with the highest position in the tuple.]]>
  23787. </doc>
  23788. </method>
  23789. <method name="createValue" return="V"
  23790. abstract="false" native="false" synchronized="false"
  23791. static="false" final="false" visibility="public"
  23792. deprecated="not deprecated">
  23793. </method>
  23794. <method name="fillJoinCollector"
  23795. abstract="false" native="false" synchronized="false"
  23796. static="false" final="false" visibility="protected"
  23797. deprecated="not deprecated">
  23798. <param name="iterkey" type="K"/>
  23799. <exception name="IOException" type="java.io.IOException"/>
  23800. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  23801. <doc>
  23802. <![CDATA[Instead of filling the JoinCollector with iterators from all
  23803. data sources, fill only the rightmost for this key.
  23804. This not only saves space by discarding the other sources, but
  23805. it also emits the number of key-value pairs in the preferred
  23806. RecordReader instead of repeating that stream n times, where
  23807. n is the cardinality of the cross product of the discarded
  23808. streams for the given key.]]>
  23809. </doc>
  23810. </method>
  23811. <doc>
  23812. <![CDATA[Prefer the &quot;rightmost&quot; data source for this key.
  23813. For example, <tt>override(S1,S2,S3)</tt> will prefer values
  23814. from S3 over S2, and values from S2 over S1 for all keys
  23815. emitted from all sources.]]>
  23816. </doc>
  23817. </class>
  23818. <!-- end class org.apache.hadoop.mapreduce.lib.join.OverrideRecordReader -->
  23819. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser -->
  23820. <class name="Parser" extends="java.lang.Object"
  23821. abstract="false"
  23822. static="false" final="false" visibility="public"
  23823. deprecated="not deprecated">
  23824. <constructor name="Parser"
  23825. static="false" final="false" visibility="public"
  23826. deprecated="not deprecated">
  23827. </constructor>
  23828. <doc>
  23829. <![CDATA[Very simple shift-reduce parser for join expressions.
  23830. This should be sufficient for the user extension permitted now, but ought to
  23831. be replaced with a parser generator if more complex grammars are supported.
  23832. In particular, this &quot;shift-reduce&quot; parser has no states. Each set
  23833. of formals requires a different internal node type, which is responsible for
  23834. interpreting the list of tokens it receives. This is sufficient for the
  23835. current grammar, but it has several annoying properties that might inhibit
  23836. extension. In particular, parentheses are always function calls; an
  23837. algebraic or filter grammar would not only require a node type, but must
  23838. also work around the internals of this parser.
  23839. For most other cases, adding classes to the hierarchy, particularly by
  23840. extending JoinRecordReader and MultiFilterRecordReader, is fairly
  23841. straightforward. One need only override the relevant method(s) (usually only
  23842. {@link CompositeRecordReader#combine}) and include a property to map its
  23843. value to an identifier in the parser.]]>
  23844. </doc>
  23845. </class>
  23846. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser -->
  23847. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser.Node -->
  23848. <class name="Parser.Node" extends="org.apache.hadoop.mapreduce.lib.join.ComposableInputFormat"
  23849. abstract="true"
  23850. static="true" final="false" visibility="public"
  23851. deprecated="not deprecated">
  23852. <constructor name="Parser.Node" type="java.lang.String"
  23853. static="false" final="false" visibility="protected"
  23854. deprecated="not deprecated">
  23855. </constructor>
  23856. <method name="addIdentifier"
  23857. abstract="false" native="false" synchronized="false"
  23858. static="true" final="false" visibility="protected"
  23859. deprecated="not deprecated">
  23860. <param name="ident" type="java.lang.String"/>
  23861. <param name="mcstrSig" type="java.lang.Class[]"/>
  23862. <param name="nodetype" type="java.lang.Class"/>
  23863. <param name="cl" type="java.lang.Class"/>
  23864. <exception name="NoSuchMethodException" type="java.lang.NoSuchMethodException"/>
  23865. <doc>
  23866. <![CDATA[For a given identifier, add a mapping to the nodetype for the parse
  23867. tree and to the ComposableRecordReader to be created, including the
  23868. formals required to invoke the constructor.
  23869. The nodetype and constructor signature should be filled in from the
  23870. child node.]]>
  23871. </doc>
  23872. </method>
  23873. <method name="setID"
  23874. abstract="false" native="false" synchronized="false"
  23875. static="false" final="false" visibility="protected"
  23876. deprecated="not deprecated">
  23877. <param name="id" type="int"/>
  23878. </method>
  23879. <method name="setKeyComparator"
  23880. abstract="false" native="false" synchronized="false"
  23881. static="false" final="false" visibility="protected"
  23882. deprecated="not deprecated">
  23883. <param name="cmpcl" type="java.lang.Class"/>
  23884. </method>
  23885. <field name="rrCstrMap" type="java.util.Map"
  23886. transient="false" volatile="false"
  23887. static="true" final="true" visibility="protected"
  23888. deprecated="not deprecated">
  23889. </field>
  23890. <field name="id" type="int"
  23891. transient="false" volatile="false"
  23892. static="false" final="false" visibility="protected"
  23893. deprecated="not deprecated">
  23894. </field>
  23895. <field name="ident" type="java.lang.String"
  23896. transient="false" volatile="false"
  23897. static="false" final="false" visibility="protected"
  23898. deprecated="not deprecated">
  23899. </field>
  23900. <field name="cmpcl" type="java.lang.Class"
  23901. transient="false" volatile="false"
  23902. static="false" final="false" visibility="protected"
  23903. deprecated="not deprecated">
  23904. </field>
  23905. </class>
  23906. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser.Node -->
  23907. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser.NodeToken -->
  23908. <class name="Parser.NodeToken" extends="org.apache.hadoop.mapreduce.lib.join.Parser.Token"
  23909. abstract="false"
  23910. static="true" final="false" visibility="public"
  23911. deprecated="not deprecated">
  23912. <method name="getNode" return="org.apache.hadoop.mapreduce.lib.join.Parser.Node"
  23913. abstract="false" native="false" synchronized="false"
  23914. static="false" final="false" visibility="public"
  23915. deprecated="not deprecated">
  23916. </method>
  23917. </class>
  23918. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser.NodeToken -->
  23919. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser.NumToken -->
  23920. <class name="Parser.NumToken" extends="org.apache.hadoop.mapreduce.lib.join.Parser.Token"
  23921. abstract="false"
  23922. static="true" final="false" visibility="public"
  23923. deprecated="not deprecated">
  23924. <constructor name="Parser.NumToken" type="double"
  23925. static="false" final="false" visibility="public"
  23926. deprecated="not deprecated">
  23927. </constructor>
  23928. <method name="getNum" return="double"
  23929. abstract="false" native="false" synchronized="false"
  23930. static="false" final="false" visibility="public"
  23931. deprecated="not deprecated">
  23932. </method>
  23933. </class>
  23934. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser.NumToken -->
  23935. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser.StrToken -->
  23936. <class name="Parser.StrToken" extends="org.apache.hadoop.mapreduce.lib.join.Parser.Token"
  23937. abstract="false"
  23938. static="true" final="false" visibility="public"
  23939. deprecated="not deprecated">
  23940. <constructor name="Parser.StrToken" type="org.apache.hadoop.mapreduce.lib.join.Parser.TType, java.lang.String"
  23941. static="false" final="false" visibility="public"
  23942. deprecated="not deprecated">
  23943. </constructor>
  23944. <method name="getStr" return="java.lang.String"
  23945. abstract="false" native="false" synchronized="false"
  23946. static="false" final="false" visibility="public"
  23947. deprecated="not deprecated">
  23948. </method>
  23949. </class>
  23950. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser.StrToken -->
  23951. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser.Token -->
  23952. <class name="Parser.Token" extends="java.lang.Object"
  23953. abstract="false"
  23954. static="true" final="false" visibility="public"
  23955. deprecated="not deprecated">
  23956. <method name="getType" return="org.apache.hadoop.mapreduce.lib.join.Parser.TType"
  23957. abstract="false" native="false" synchronized="false"
  23958. static="false" final="false" visibility="public"
  23959. deprecated="not deprecated">
  23960. </method>
  23961. <method name="getNode" return="org.apache.hadoop.mapreduce.lib.join.Parser.Node"
  23962. abstract="false" native="false" synchronized="false"
  23963. static="false" final="false" visibility="public"
  23964. deprecated="not deprecated">
  23965. <exception name="IOException" type="java.io.IOException"/>
  23966. </method>
  23967. <method name="getNum" return="double"
  23968. abstract="false" native="false" synchronized="false"
  23969. static="false" final="false" visibility="public"
  23970. deprecated="not deprecated">
  23971. <exception name="IOException" type="java.io.IOException"/>
  23972. </method>
  23973. <method name="getStr" return="java.lang.String"
  23974. abstract="false" native="false" synchronized="false"
  23975. static="false" final="false" visibility="public"
  23976. deprecated="not deprecated">
  23977. <exception name="IOException" type="java.io.IOException"/>
  23978. </method>
  23979. <doc>
  23980. <![CDATA[Tagged-union type for tokens from the join expression.
  23981. @see Parser.TType]]>
  23982. </doc>
  23983. </class>
  23984. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser.Token -->
  23985. <!-- start class org.apache.hadoop.mapreduce.lib.join.Parser.TType -->
  23986. <class name="Parser.TType" extends="java.lang.Enum"
  23987. abstract="false"
  23988. static="true" final="true" visibility="public"
  23989. deprecated="not deprecated">
  23990. <method name="values" return="org.apache.hadoop.mapreduce.lib.join.Parser.TType[]"
  23991. abstract="false" native="false" synchronized="false"
  23992. static="true" final="false" visibility="public"
  23993. deprecated="not deprecated">
  23994. </method>
  23995. <method name="valueOf" return="org.apache.hadoop.mapreduce.lib.join.Parser.TType"
  23996. abstract="false" native="false" synchronized="false"
  23997. static="true" final="false" visibility="public"
  23998. deprecated="not deprecated">
  23999. <param name="name" type="java.lang.String"/>
  24000. </method>
  24001. </class>
  24002. <!-- end class org.apache.hadoop.mapreduce.lib.join.Parser.TType -->
  24003. <!-- start interface org.apache.hadoop.mapreduce.lib.join.ResetableIterator -->
  24004. <interface name="ResetableIterator" abstract="true"
  24005. static="false" final="false" visibility="public"
  24006. deprecated="not deprecated">
  24007. <method name="hasNext" return="boolean"
  24008. abstract="false" native="false" synchronized="false"
  24009. static="false" final="false" visibility="public"
  24010. deprecated="not deprecated">
  24011. <doc>
  24012. <![CDATA[True if a call to next may return a value. This method may return
  24013. false positives, but never false negatives.]]>
  24014. </doc>
  24015. </method>
  24016. <method name="next" return="boolean"
  24017. abstract="false" native="false" synchronized="false"
  24018. static="false" final="false" visibility="public"
  24019. deprecated="not deprecated">
  24020. <param name="val" type="T"/>
  24021. <exception name="IOException" type="java.io.IOException"/>
  24022. <doc>
  24023. <![CDATA[Assign next value to actual.
  24024. It is required that elements added to a ResetableIterator be returned in
  24025. the same order after a call to {@link #reset} (FIFO).
  24026. Note that a call to this may fail for nested joins (i.e. more elements
  24027. available, but none satisfying the constraints of the join)]]>
  24028. </doc>
  24029. </method>
  24030. <method name="replay" return="boolean"
  24031. abstract="false" native="false" synchronized="false"
  24032. static="false" final="false" visibility="public"
  24033. deprecated="not deprecated">
  24034. <param name="val" type="T"/>
  24035. <exception name="IOException" type="java.io.IOException"/>
  24036. <doc>
  24037. <![CDATA[Assign last value returned to actual.]]>
  24038. </doc>
  24039. </method>
  24040. <method name="reset"
  24041. abstract="false" native="false" synchronized="false"
  24042. static="false" final="false" visibility="public"
  24043. deprecated="not deprecated">
  24044. <doc>
  24045. <![CDATA[Set iterator to return to the start of its range. Must be called after
  24046. calling {@link #add} to avoid a ConcurrentModificationException.]]>
  24047. </doc>
  24048. </method>
  24049. <method name="add"
  24050. abstract="false" native="false" synchronized="false"
  24051. static="false" final="false" visibility="public"
  24052. deprecated="not deprecated">
  24053. <param name="item" type="T"/>
  24054. <exception name="IOException" type="java.io.IOException"/>
  24055. <doc>
  24056. <![CDATA[Add an element to the collection of elements to iterate over.]]>
  24057. </doc>
  24058. </method>
  24059. <method name="close"
  24060. abstract="false" native="false" synchronized="false"
  24061. static="false" final="false" visibility="public"
  24062. deprecated="not deprecated">
  24063. <exception name="IOException" type="java.io.IOException"/>
  24064. <doc>
  24065. <![CDATA[Close datasources and release resources. Calling methods on the iterator
  24066. after calling close has undefined behavior.]]>
  24067. </doc>
  24068. </method>
  24069. <method name="clear"
  24070. abstract="false" native="false" synchronized="false"
  24071. static="false" final="false" visibility="public"
  24072. deprecated="not deprecated">
  24073. <doc>
  24074. <![CDATA[Close datasources, but do not release internal resources. Calling this
  24075. method should permit the object to be reused with a different datasource.]]>
  24076. </doc>
  24077. </method>
  24078. <doc>
  24079. <![CDATA[This defines an interface to a stateful Iterator that can replay elements
  24080. added to it directly.
  24081. Note that this does not extend {@link java.util.Iterator}.]]>
  24082. </doc>
  24083. </interface>
  24084. <!-- end interface org.apache.hadoop.mapreduce.lib.join.ResetableIterator -->
  24085. <!-- start class org.apache.hadoop.mapreduce.lib.join.ResetableIterator.EMPTY -->
  24086. <class name="ResetableIterator.EMPTY" extends="java.lang.Object"
  24087. abstract="false"
  24088. static="true" final="false" visibility="public"
  24089. deprecated="not deprecated">
  24090. <implements name="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  24091. <constructor name="ResetableIterator.EMPTY"
  24092. static="false" final="false" visibility="public"
  24093. deprecated="not deprecated">
  24094. </constructor>
  24095. <method name="hasNext" return="boolean"
  24096. abstract="false" native="false" synchronized="false"
  24097. static="false" final="false" visibility="public"
  24098. deprecated="not deprecated">
  24099. </method>
  24100. <method name="reset"
  24101. abstract="false" native="false" synchronized="false"
  24102. static="false" final="false" visibility="public"
  24103. deprecated="not deprecated">
  24104. </method>
  24105. <method name="close"
  24106. abstract="false" native="false" synchronized="false"
  24107. static="false" final="false" visibility="public"
  24108. deprecated="not deprecated">
  24109. <exception name="IOException" type="java.io.IOException"/>
  24110. </method>
  24111. <method name="clear"
  24112. abstract="false" native="false" synchronized="false"
  24113. static="false" final="false" visibility="public"
  24114. deprecated="not deprecated">
  24115. </method>
  24116. <method name="next" return="boolean"
  24117. abstract="false" native="false" synchronized="false"
  24118. static="false" final="false" visibility="public"
  24119. deprecated="not deprecated">
  24120. <param name="val" type="U"/>
  24121. <exception name="IOException" type="java.io.IOException"/>
  24122. </method>
  24123. <method name="replay" return="boolean"
  24124. abstract="false" native="false" synchronized="false"
  24125. static="false" final="false" visibility="public"
  24126. deprecated="not deprecated">
  24127. <param name="val" type="U"/>
  24128. <exception name="IOException" type="java.io.IOException"/>
  24129. </method>
  24130. <method name="add"
  24131. abstract="false" native="false" synchronized="false"
  24132. static="false" final="false" visibility="public"
  24133. deprecated="not deprecated">
  24134. <param name="item" type="U"/>
  24135. <exception name="IOException" type="java.io.IOException"/>
  24136. </method>
  24137. </class>
  24138. <!-- end class org.apache.hadoop.mapreduce.lib.join.ResetableIterator.EMPTY -->
  24139. <!-- start class org.apache.hadoop.mapreduce.lib.join.StreamBackedIterator -->
  24140. <class name="StreamBackedIterator" extends="java.lang.Object"
  24141. abstract="false"
  24142. static="false" final="false" visibility="public"
  24143. deprecated="not deprecated">
  24144. <implements name="org.apache.hadoop.mapreduce.lib.join.ResetableIterator"/>
  24145. <constructor name="StreamBackedIterator"
  24146. static="false" final="false" visibility="public"
  24147. deprecated="not deprecated">
  24148. </constructor>
  24149. <method name="hasNext" return="boolean"
  24150. abstract="false" native="false" synchronized="false"
  24151. static="false" final="false" visibility="public"
  24152. deprecated="not deprecated">
  24153. </method>
  24154. <method name="next" return="boolean"
  24155. abstract="false" native="false" synchronized="false"
  24156. static="false" final="false" visibility="public"
  24157. deprecated="not deprecated">
  24158. <param name="val" type="X"/>
  24159. <exception name="IOException" type="java.io.IOException"/>
  24160. </method>
  24161. <method name="replay" return="boolean"
  24162. abstract="false" native="false" synchronized="false"
  24163. static="false" final="false" visibility="public"
  24164. deprecated="not deprecated">
  24165. <param name="val" type="X"/>
  24166. <exception name="IOException" type="java.io.IOException"/>
  24167. </method>
  24168. <method name="reset"
  24169. abstract="false" native="false" synchronized="false"
  24170. static="false" final="false" visibility="public"
  24171. deprecated="not deprecated">
  24172. </method>
  24173. <method name="add"
  24174. abstract="false" native="false" synchronized="false"
  24175. static="false" final="false" visibility="public"
  24176. deprecated="not deprecated">
  24177. <param name="item" type="X"/>
  24178. <exception name="IOException" type="java.io.IOException"/>
  24179. </method>
  24180. <method name="close"
  24181. abstract="false" native="false" synchronized="false"
  24182. static="false" final="false" visibility="public"
  24183. deprecated="not deprecated">
  24184. <exception name="IOException" type="java.io.IOException"/>
  24185. </method>
  24186. <method name="clear"
  24187. abstract="false" native="false" synchronized="false"
  24188. static="false" final="false" visibility="public"
  24189. deprecated="not deprecated">
  24190. </method>
  24191. <doc>
  24192. <![CDATA[This class provides an implementation of ResetableIterator. This
  24193. implementation uses a byte array to store elements added to it.]]>
  24194. </doc>
  24195. </class>
  24196. <!-- end class org.apache.hadoop.mapreduce.lib.join.StreamBackedIterator -->
  24197. <!-- start class org.apache.hadoop.mapreduce.lib.join.TupleWritable -->
  24198. <class name="TupleWritable" extends="java.lang.Object"
  24199. abstract="false"
  24200. static="false" final="false" visibility="public"
  24201. deprecated="not deprecated">
  24202. <implements name="org.apache.hadoop.io.Writable"/>
  24203. <implements name="java.lang.Iterable"/>
  24204. <constructor name="TupleWritable"
  24205. static="false" final="false" visibility="public"
  24206. deprecated="not deprecated">
  24207. <doc>
  24208. <![CDATA[Create an empty tuple with no allocated storage for writables.]]>
  24209. </doc>
  24210. </constructor>
  24211. <constructor name="TupleWritable" type="org.apache.hadoop.io.Writable[]"
  24212. static="false" final="false" visibility="public"
  24213. deprecated="not deprecated">
  24214. <doc>
  24215. <![CDATA[Initialize tuple with storage; unknown whether any of them contain
  24216. &quot;written&quot; values.]]>
  24217. </doc>
  24218. </constructor>
  24219. <method name="has" return="boolean"
  24220. abstract="false" native="false" synchronized="false"
  24221. static="false" final="false" visibility="public"
  24222. deprecated="not deprecated">
  24223. <param name="i" type="int"/>
  24224. <doc>
  24225. <![CDATA[Return true if tuple has an element at the position provided.]]>
  24226. </doc>
  24227. </method>
  24228. <method name="get" return="org.apache.hadoop.io.Writable"
  24229. abstract="false" native="false" synchronized="false"
  24230. static="false" final="false" visibility="public"
  24231. deprecated="not deprecated">
  24232. <param name="i" type="int"/>
  24233. <doc>
  24234. <![CDATA[Get ith Writable from Tuple.]]>
  24235. </doc>
  24236. </method>
  24237. <method name="size" return="int"
  24238. abstract="false" native="false" synchronized="false"
  24239. static="false" final="false" visibility="public"
  24240. deprecated="not deprecated">
  24241. <doc>
  24242. <![CDATA[The number of children in this Tuple.]]>
  24243. </doc>
  24244. </method>
  24245. <method name="equals" return="boolean"
  24246. abstract="false" native="false" synchronized="false"
  24247. static="false" final="false" visibility="public"
  24248. deprecated="not deprecated">
  24249. <param name="other" type="java.lang.Object"/>
  24250. <doc>
  24251. <![CDATA[{@inheritDoc}]]>
  24252. </doc>
  24253. </method>
  24254. <method name="hashCode" return="int"
  24255. abstract="false" native="false" synchronized="false"
  24256. static="false" final="false" visibility="public"
  24257. deprecated="not deprecated">
  24258. </method>
  24259. <method name="iterator" return="java.util.Iterator"
  24260. abstract="false" native="false" synchronized="false"
  24261. static="false" final="false" visibility="public"
  24262. deprecated="not deprecated">
  24263. <doc>
  24264. <![CDATA[Return an iterator over the elements in this tuple.
  24265. Note that this doesn't flatten the tuple; one may receive tuples
  24266. from this iterator.]]>
  24267. </doc>
  24268. </method>
  24269. <method name="toString" return="java.lang.String"
  24270. abstract="false" native="false" synchronized="false"
  24271. static="false" final="false" visibility="public"
  24272. deprecated="not deprecated">
  24273. <doc>
  24274. <![CDATA[Convert Tuple to String as in the following.
  24275. <tt>[<child1>,<child2>,...,<childn>]</tt>]]>
  24276. </doc>
  24277. </method>
  24278. <method name="write"
  24279. abstract="false" native="false" synchronized="false"
  24280. static="false" final="false" visibility="public"
  24281. deprecated="not deprecated">
  24282. <param name="out" type="java.io.DataOutput"/>
  24283. <exception name="IOException" type="java.io.IOException"/>
  24284. <doc>
  24285. <![CDATA[Writes each Writable to <code>out</code>.
  24286. TupleWritable format:
  24287. {@code
  24288. <count><type1><type2>...<typen><obj1><obj2>...<objn>
  24289. }]]>
  24290. </doc>
  24291. </method>
  24292. <method name="readFields"
  24293. abstract="false" native="false" synchronized="false"
  24294. static="false" final="false" visibility="public"
  24295. deprecated="not deprecated">
  24296. <param name="in" type="java.io.DataInput"/>
  24297. <exception name="IOException" type="java.io.IOException"/>
  24298. <doc>
  24299. <![CDATA[{@inheritDoc}]]>
  24300. </doc>
  24301. </method>
  24302. <field name="written" type="java.util.BitSet"
  24303. transient="false" volatile="false"
  24304. static="false" final="false" visibility="protected"
  24305. deprecated="not deprecated">
  24306. </field>
  24307. <doc>
  24308. <![CDATA[Writable type storing multiple {@link org.apache.hadoop.io.Writable}s.
  24309. This is *not* a general-purpose tuple type. In almost all cases, users are
  24310. encouraged to implement their own serializable types, which can perform
  24311. better validation and provide more efficient encodings than this class is
  24312. capable of. TupleWritable relies on the join framework for type safety and
  24313. assumes its instances will rarely be persisted, assumptions not only
  24314. incompatible with, but contrary to the general case.
  24315. @see org.apache.hadoop.io.Writable]]>
  24316. </doc>
  24317. </class>
  24318. <!-- end class org.apache.hadoop.mapreduce.lib.join.TupleWritable -->
  24319. <!-- start class org.apache.hadoop.mapreduce.lib.join.WrappedRecordReader -->
  24320. <class name="WrappedRecordReader" extends="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader"
  24321. abstract="false"
  24322. static="false" final="false" visibility="public"
  24323. deprecated="not deprecated">
  24324. <constructor name="WrappedRecordReader" type="int"
  24325. static="false" final="false" visibility="protected"
  24326. deprecated="not deprecated">
  24327. </constructor>
  24328. <method name="initialize"
  24329. abstract="false" native="false" synchronized="false"
  24330. static="false" final="false" visibility="public"
  24331. deprecated="not deprecated">
  24332. <param name="split" type="org.apache.hadoop.mapreduce.InputSplit"/>
  24333. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  24334. <exception name="IOException" type="java.io.IOException"/>
  24335. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24336. </method>
  24337. <method name="createKey" return="K"
  24338. abstract="false" native="false" synchronized="false"
  24339. static="false" final="false" visibility="public"
  24340. deprecated="not deprecated">
  24341. <doc>
  24342. <![CDATA[Request new key from proxied RR.]]>
  24343. </doc>
  24344. </method>
  24345. <method name="createValue" return="U"
  24346. abstract="false" native="false" synchronized="false"
  24347. static="false" final="false" visibility="public"
  24348. deprecated="not deprecated">
  24349. </method>
  24350. <method name="id" return="int"
  24351. abstract="false" native="false" synchronized="false"
  24352. static="false" final="false" visibility="public"
  24353. deprecated="not deprecated">
  24354. <doc>
  24355. <![CDATA[{@inheritDoc}]]>
  24356. </doc>
  24357. </method>
  24358. <method name="key" return="K"
  24359. abstract="false" native="false" synchronized="false"
  24360. static="false" final="false" visibility="public"
  24361. deprecated="not deprecated">
  24362. <doc>
  24363. <![CDATA[Return the key at the head of this RR.]]>
  24364. </doc>
  24365. </method>
  24366. <method name="key"
  24367. abstract="false" native="false" synchronized="false"
  24368. static="false" final="false" visibility="public"
  24369. deprecated="not deprecated">
  24370. <param name="qkey" type="K"/>
  24371. <exception name="IOException" type="java.io.IOException"/>
  24372. <doc>
  24373. <![CDATA[Clone the key at the head of this RR into the object supplied.]]>
  24374. </doc>
  24375. </method>
  24376. <method name="hasNext" return="boolean"
  24377. abstract="false" native="false" synchronized="false"
  24378. static="false" final="false" visibility="public"
  24379. deprecated="not deprecated">
  24380. <doc>
  24381. <![CDATA[Return true if the RR- including the k,v pair stored in this object-
  24382. is exhausted.]]>
  24383. </doc>
  24384. </method>
  24385. <method name="skip"
  24386. abstract="false" native="false" synchronized="false"
  24387. static="false" final="false" visibility="public"
  24388. deprecated="not deprecated">
  24389. <param name="key" type="K"/>
  24390. <exception name="IOException" type="java.io.IOException"/>
  24391. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24392. <doc>
  24393. <![CDATA[Skip key-value pairs with keys less than or equal to the key provided.]]>
  24394. </doc>
  24395. </method>
  24396. <method name="accept"
  24397. abstract="false" native="false" synchronized="false"
  24398. static="false" final="false" visibility="public"
  24399. deprecated="not deprecated">
  24400. <param name="i" type="org.apache.hadoop.mapreduce.lib.join.CompositeRecordReader.JoinCollector"/>
  24401. <param name="key" type="K"/>
  24402. <exception name="IOException" type="java.io.IOException"/>
  24403. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24404. <doc>
  24405. <![CDATA[Add an iterator to the collector at the position occupied by this
  24406. RecordReader over the values in this stream paired with the key
  24407. provided (ie register a stream of values from this source matching K
  24408. with a collector).]]>
  24409. </doc>
  24410. </method>
  24411. <method name="nextKeyValue" return="boolean"
  24412. abstract="false" native="false" synchronized="false"
  24413. static="false" final="false" visibility="public"
  24414. deprecated="not deprecated">
  24415. <exception name="IOException" type="java.io.IOException"/>
  24416. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24417. <doc>
  24418. <![CDATA[Read the next k,v pair into the head of this object; return true iff
  24419. the RR and this are exhausted.]]>
  24420. </doc>
  24421. </method>
  24422. <method name="getCurrentKey" return="K"
  24423. abstract="false" native="false" synchronized="false"
  24424. static="false" final="false" visibility="public"
  24425. deprecated="not deprecated">
  24426. <exception name="IOException" type="java.io.IOException"/>
  24427. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24428. <doc>
  24429. <![CDATA[Get current key]]>
  24430. </doc>
  24431. </method>
  24432. <method name="getCurrentValue" return="U"
  24433. abstract="false" native="false" synchronized="false"
  24434. static="false" final="false" visibility="public"
  24435. deprecated="not deprecated">
  24436. <exception name="IOException" type="java.io.IOException"/>
  24437. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24438. <doc>
  24439. <![CDATA[Get current value]]>
  24440. </doc>
  24441. </method>
  24442. <method name="getProgress" return="float"
  24443. abstract="false" native="false" synchronized="false"
  24444. static="false" final="false" visibility="public"
  24445. deprecated="not deprecated">
  24446. <exception name="IOException" type="java.io.IOException"/>
  24447. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24448. <doc>
  24449. <![CDATA[Request progress from proxied RR.]]>
  24450. </doc>
  24451. </method>
  24452. <method name="close"
  24453. abstract="false" native="false" synchronized="false"
  24454. static="false" final="false" visibility="public"
  24455. deprecated="not deprecated">
  24456. <exception name="IOException" type="java.io.IOException"/>
  24457. <doc>
  24458. <![CDATA[Forward close request to proxied RR.]]>
  24459. </doc>
  24460. </method>
  24461. <method name="compareTo" return="int"
  24462. abstract="false" native="false" synchronized="false"
  24463. static="false" final="false" visibility="public"
  24464. deprecated="not deprecated">
  24465. <param name="other" type="org.apache.hadoop.mapreduce.lib.join.ComposableRecordReader"/>
  24466. <doc>
  24467. <![CDATA[Implement Comparable contract (compare key at head of proxied RR
  24468. with that of another).]]>
  24469. </doc>
  24470. </method>
  24471. <method name="equals" return="boolean"
  24472. abstract="false" native="false" synchronized="false"
  24473. static="false" final="false" visibility="public"
  24474. deprecated="not deprecated">
  24475. <param name="other" type="java.lang.Object"/>
  24476. <doc>
  24477. <![CDATA[Return true iff compareTo(other) returns 0.]]>
  24478. </doc>
  24479. </method>
  24480. <method name="hashCode" return="int"
  24481. abstract="false" native="false" synchronized="false"
  24482. static="false" final="false" visibility="public"
  24483. deprecated="not deprecated">
  24484. </method>
  24485. <field name="empty" type="boolean"
  24486. transient="false" volatile="false"
  24487. static="false" final="false" visibility="protected"
  24488. deprecated="not deprecated">
  24489. </field>
  24490. <field name="cmp" type="org.apache.hadoop.io.WritableComparator"
  24491. transient="false" volatile="false"
  24492. static="false" final="false" visibility="protected"
  24493. deprecated="not deprecated">
  24494. </field>
  24495. <doc>
  24496. <![CDATA[Proxy class for a RecordReader participating in the join framework.
  24497. This class keeps track of the &quot;head&quot; key-value pair for the
  24498. provided RecordReader and keeps a store of values matching a key when
  24499. this source is participating in a join.]]>
  24500. </doc>
  24501. </class>
  24502. <!-- end class org.apache.hadoop.mapreduce.lib.join.WrappedRecordReader -->
  24503. </package>
  24504. <package name="org.apache.hadoop.mapreduce.lib.map">
  24505. <!-- start class org.apache.hadoop.mapreduce.lib.map.InverseMapper -->
  24506. <class name="InverseMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  24507. abstract="false"
  24508. static="false" final="false" visibility="public"
  24509. deprecated="not deprecated">
  24510. <constructor name="InverseMapper"
  24511. static="false" final="false" visibility="public"
  24512. deprecated="not deprecated">
  24513. </constructor>
  24514. <method name="map"
  24515. abstract="false" native="false" synchronized="false"
  24516. static="false" final="false" visibility="public"
  24517. deprecated="not deprecated">
  24518. <param name="key" type="K"/>
  24519. <param name="value" type="V"/>
  24520. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  24521. <exception name="IOException" type="java.io.IOException"/>
  24522. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24523. <doc>
  24524. <![CDATA[The inverse function. Input keys and values are swapped.]]>
  24525. </doc>
  24526. </method>
  24527. <doc>
  24528. <![CDATA[A {@link Mapper} that swaps keys and values.]]>
  24529. </doc>
  24530. </class>
  24531. <!-- end class org.apache.hadoop.mapreduce.lib.map.InverseMapper -->
  24532. <!-- start class org.apache.hadoop.mapreduce.lib.map.MultithreadedMapper -->
  24533. <class name="MultithreadedMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  24534. abstract="false"
  24535. static="false" final="false" visibility="public"
  24536. deprecated="not deprecated">
  24537. <constructor name="MultithreadedMapper"
  24538. static="false" final="false" visibility="public"
  24539. deprecated="not deprecated">
  24540. </constructor>
  24541. <method name="getNumberOfThreads" return="int"
  24542. abstract="false" native="false" synchronized="false"
  24543. static="true" final="false" visibility="public"
  24544. deprecated="not deprecated">
  24545. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  24546. <doc>
  24547. <![CDATA[The number of threads in the thread pool that will run the map function.
  24548. @param job the job
  24549. @return the number of threads]]>
  24550. </doc>
  24551. </method>
  24552. <method name="setNumberOfThreads"
  24553. abstract="false" native="false" synchronized="false"
  24554. static="true" final="false" visibility="public"
  24555. deprecated="not deprecated">
  24556. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  24557. <param name="threads" type="int"/>
  24558. <doc>
  24559. <![CDATA[Set the number of threads in the pool for running maps.
  24560. @param job the job to modify
  24561. @param threads the new number of threads]]>
  24562. </doc>
  24563. </method>
  24564. <method name="getMapperClass" return="java.lang.Class"
  24565. abstract="false" native="false" synchronized="false"
  24566. static="true" final="false" visibility="public"
  24567. deprecated="not deprecated">
  24568. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  24569. <doc>
  24570. <![CDATA[Get the application's mapper class.
  24571. @param <K1> the map's input key type
  24572. @param <V1> the map's input value type
  24573. @param <K2> the map's output key type
  24574. @param <V2> the map's output value type
  24575. @param job the job
  24576. @return the mapper class to run]]>
  24577. </doc>
  24578. </method>
  24579. <method name="setMapperClass"
  24580. abstract="false" native="false" synchronized="false"
  24581. static="true" final="false" visibility="public"
  24582. deprecated="not deprecated">
  24583. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  24584. <param name="cls" type="java.lang.Class"/>
  24585. <doc>
  24586. <![CDATA[Set the application's mapper class.
  24587. @param <K1> the map input key type
  24588. @param <V1> the map input value type
  24589. @param <K2> the map output key type
  24590. @param <V2> the map output value type
  24591. @param job the job to modify
  24592. @param cls the class to use as the mapper]]>
  24593. </doc>
  24594. </method>
  24595. <method name="run"
  24596. abstract="false" native="false" synchronized="false"
  24597. static="false" final="false" visibility="public"
  24598. deprecated="not deprecated">
  24599. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  24600. <exception name="IOException" type="java.io.IOException"/>
  24601. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24602. <doc>
  24603. <![CDATA[Run the application's maps using a thread pool.]]>
  24604. </doc>
  24605. </method>
  24606. <field name="NUM_THREADS" type="java.lang.String"
  24607. transient="false" volatile="false"
  24608. static="true" final="false" visibility="public"
  24609. deprecated="not deprecated">
  24610. </field>
  24611. <field name="MAP_CLASS" type="java.lang.String"
  24612. transient="false" volatile="false"
  24613. static="true" final="false" visibility="public"
  24614. deprecated="not deprecated">
  24615. </field>
  24616. <doc>
  24617. <![CDATA[Multithreaded implementation for {@link org.apache.hadoop.mapreduce.Mapper}.
  24618. <p>
  24619. It can be used instead of the default implementation,
  24620. {@link org.apache.hadoop.mapred.MapRunner}, when the Map operation is not CPU
  24621. bound in order to improve throughput.
  24622. <p>
  24623. Mapper implementations using this MapRunnable must be thread-safe.
  24624. <p>
  24625. The Map-Reduce job has to be configured with the mapper to use via
  24626. {@link #setMapperClass(Job, Class)} and
  24627. the number of threads the thread-pool can use with the
  24628. {@link #getNumberOfThreads(JobContext)} method. The default
  24629. value is 10 threads.
  24630. <p>]]>
  24631. </doc>
  24632. </class>
  24633. <!-- end class org.apache.hadoop.mapreduce.lib.map.MultithreadedMapper -->
  24634. <!-- start class org.apache.hadoop.mapreduce.lib.map.RegexMapper -->
  24635. <class name="RegexMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  24636. abstract="false"
  24637. static="false" final="false" visibility="public"
  24638. deprecated="not deprecated">
  24639. <constructor name="RegexMapper"
  24640. static="false" final="false" visibility="public"
  24641. deprecated="not deprecated">
  24642. </constructor>
  24643. <method name="setup"
  24644. abstract="false" native="false" synchronized="false"
  24645. static="false" final="false" visibility="public"
  24646. deprecated="not deprecated">
  24647. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  24648. </method>
  24649. <method name="map"
  24650. abstract="false" native="false" synchronized="false"
  24651. static="false" final="false" visibility="public"
  24652. deprecated="not deprecated">
  24653. <param name="key" type="K"/>
  24654. <param name="value" type="org.apache.hadoop.io.Text"/>
  24655. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  24656. <exception name="IOException" type="java.io.IOException"/>
  24657. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24658. </method>
  24659. <field name="PATTERN" type="java.lang.String"
  24660. transient="false" volatile="false"
  24661. static="true" final="false" visibility="public"
  24662. deprecated="not deprecated">
  24663. </field>
  24664. <field name="GROUP" type="java.lang.String"
  24665. transient="false" volatile="false"
  24666. static="true" final="false" visibility="public"
  24667. deprecated="not deprecated">
  24668. </field>
  24669. <doc>
  24670. <![CDATA[A {@link Mapper} that extracts text matching a regular expression.]]>
  24671. </doc>
  24672. </class>
  24673. <!-- end class org.apache.hadoop.mapreduce.lib.map.RegexMapper -->
  24674. <!-- start class org.apache.hadoop.mapreduce.lib.map.TokenCounterMapper -->
  24675. <class name="TokenCounterMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  24676. abstract="false"
  24677. static="false" final="false" visibility="public"
  24678. deprecated="not deprecated">
  24679. <constructor name="TokenCounterMapper"
  24680. static="false" final="false" visibility="public"
  24681. deprecated="not deprecated">
  24682. </constructor>
  24683. <method name="map"
  24684. abstract="false" native="false" synchronized="false"
  24685. static="false" final="false" visibility="public"
  24686. deprecated="not deprecated">
  24687. <param name="key" type="java.lang.Object"/>
  24688. <param name="value" type="org.apache.hadoop.io.Text"/>
  24689. <param name="context" type="org.apache.hadoop.mapreduce.Mapper.Context"/>
  24690. <exception name="IOException" type="java.io.IOException"/>
  24691. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24692. </method>
  24693. <doc>
  24694. <![CDATA[Tokenize the input values and emit each word with a count of 1.]]>
  24695. </doc>
  24696. </class>
  24697. <!-- end class org.apache.hadoop.mapreduce.lib.map.TokenCounterMapper -->
  24698. <!-- start class org.apache.hadoop.mapreduce.lib.map.WrappedMapper -->
  24699. <class name="WrappedMapper" extends="org.apache.hadoop.mapreduce.Mapper"
  24700. abstract="false"
  24701. static="false" final="false" visibility="public"
  24702. deprecated="not deprecated">
  24703. <constructor name="WrappedMapper"
  24704. static="false" final="false" visibility="public"
  24705. deprecated="not deprecated">
  24706. </constructor>
  24707. <method name="getMapContext" return="org.apache.hadoop.mapreduce.Mapper.Context"
  24708. abstract="false" native="false" synchronized="false"
  24709. static="false" final="false" visibility="public"
  24710. deprecated="not deprecated">
  24711. <param name="mapContext" type="org.apache.hadoop.mapreduce.MapContext"/>
  24712. <doc>
  24713. <![CDATA[Get a wrapped {@link Mapper.Context} for custom implementations.
  24714. @param mapContext <code>MapContext</code> to be wrapped
  24715. @return a wrapped <code>Mapper.Context</code> for custom implementations]]>
  24716. </doc>
  24717. </method>
  24718. <doc>
  24719. <![CDATA[A {@link Mapper} which wraps a given one to allow custom
  24720. {@link Mapper.Context} implementations.]]>
  24721. </doc>
  24722. </class>
  24723. <!-- end class org.apache.hadoop.mapreduce.lib.map.WrappedMapper -->
  24724. <!-- start class org.apache.hadoop.mapreduce.lib.map.WrappedMapper.Context -->
  24725. <class name="WrappedMapper.Context" extends="org.apache.hadoop.mapreduce.Mapper.Context"
  24726. abstract="false"
  24727. static="false" final="false" visibility="public"
  24728. deprecated="not deprecated">
  24729. <constructor name="WrappedMapper.Context" type="org.apache.hadoop.mapreduce.MapContext"
  24730. static="false" final="false" visibility="public"
  24731. deprecated="not deprecated">
  24732. </constructor>
  24733. <method name="getInputSplit" return="org.apache.hadoop.mapreduce.InputSplit"
  24734. abstract="false" native="false" synchronized="false"
  24735. static="false" final="false" visibility="public"
  24736. deprecated="not deprecated">
  24737. <doc>
  24738. <![CDATA[Get the input split for this map.]]>
  24739. </doc>
  24740. </method>
  24741. <method name="getCurrentKey" return="KEYIN"
  24742. abstract="false" native="false" synchronized="false"
  24743. static="false" final="false" visibility="public"
  24744. deprecated="not deprecated">
  24745. <exception name="IOException" type="java.io.IOException"/>
  24746. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24747. </method>
  24748. <method name="getCurrentValue" return="VALUEIN"
  24749. abstract="false" native="false" synchronized="false"
  24750. static="false" final="false" visibility="public"
  24751. deprecated="not deprecated">
  24752. <exception name="IOException" type="java.io.IOException"/>
  24753. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24754. </method>
  24755. <method name="nextKeyValue" return="boolean"
  24756. abstract="false" native="false" synchronized="false"
  24757. static="false" final="false" visibility="public"
  24758. deprecated="not deprecated">
  24759. <exception name="IOException" type="java.io.IOException"/>
  24760. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24761. </method>
  24762. <method name="getCounter" return="org.apache.hadoop.mapreduce.Counter"
  24763. abstract="false" native="false" synchronized="false"
  24764. static="false" final="false" visibility="public"
  24765. deprecated="not deprecated">
  24766. <param name="counterName" type="java.lang.Enum"/>
  24767. </method>
  24768. <method name="getCounter" return="org.apache.hadoop.mapreduce.Counter"
  24769. abstract="false" native="false" synchronized="false"
  24770. static="false" final="false" visibility="public"
  24771. deprecated="not deprecated">
  24772. <param name="groupName" type="java.lang.String"/>
  24773. <param name="counterName" type="java.lang.String"/>
  24774. </method>
  24775. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  24776. abstract="false" native="false" synchronized="false"
  24777. static="false" final="false" visibility="public"
  24778. deprecated="not deprecated">
  24779. </method>
  24780. <method name="write"
  24781. abstract="false" native="false" synchronized="false"
  24782. static="false" final="false" visibility="public"
  24783. deprecated="not deprecated">
  24784. <param name="key" type="KEYOUT"/>
  24785. <param name="value" type="VALUEOUT"/>
  24786. <exception name="IOException" type="java.io.IOException"/>
  24787. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  24788. </method>
  24789. <method name="getStatus" return="java.lang.String"
  24790. abstract="false" native="false" synchronized="false"
  24791. static="false" final="false" visibility="public"
  24792. deprecated="not deprecated">
  24793. </method>
  24794. <method name="getTaskAttemptID" return="org.apache.hadoop.mapreduce.TaskAttemptID"
  24795. abstract="false" native="false" synchronized="false"
  24796. static="false" final="false" visibility="public"
  24797. deprecated="not deprecated">
  24798. </method>
  24799. <method name="setStatus"
  24800. abstract="false" native="false" synchronized="false"
  24801. static="false" final="false" visibility="public"
  24802. deprecated="not deprecated">
  24803. <param name="msg" type="java.lang.String"/>
  24804. </method>
  24805. <method name="getArchiveClassPaths" return="org.apache.hadoop.fs.Path[]"
  24806. abstract="false" native="false" synchronized="false"
  24807. static="false" final="false" visibility="public"
  24808. deprecated="not deprecated">
  24809. </method>
  24810. <method name="getArchiveTimestamps" return="java.lang.String[]"
  24811. abstract="false" native="false" synchronized="false"
  24812. static="false" final="false" visibility="public"
  24813. deprecated="not deprecated">
  24814. </method>
  24815. <method name="getCacheArchives" return="java.net.URI[]"
  24816. abstract="false" native="false" synchronized="false"
  24817. static="false" final="false" visibility="public"
  24818. deprecated="not deprecated">
  24819. <exception name="IOException" type="java.io.IOException"/>
  24820. </method>
  24821. <method name="getCacheFiles" return="java.net.URI[]"
  24822. abstract="false" native="false" synchronized="false"
  24823. static="false" final="false" visibility="public"
  24824. deprecated="not deprecated">
  24825. <exception name="IOException" type="java.io.IOException"/>
  24826. </method>
  24827. <method name="getCombinerClass" return="java.lang.Class"
  24828. abstract="false" native="false" synchronized="false"
  24829. static="false" final="false" visibility="public"
  24830. deprecated="not deprecated">
  24831. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  24832. </method>
  24833. <method name="getConfiguration" return="org.apache.hadoop.conf.Configuration"
  24834. abstract="false" native="false" synchronized="false"
  24835. static="false" final="false" visibility="public"
  24836. deprecated="not deprecated">
  24837. </method>
  24838. <method name="getFileClassPaths" return="org.apache.hadoop.fs.Path[]"
  24839. abstract="false" native="false" synchronized="false"
  24840. static="false" final="false" visibility="public"
  24841. deprecated="not deprecated">
  24842. </method>
  24843. <method name="getFileTimestamps" return="java.lang.String[]"
  24844. abstract="false" native="false" synchronized="false"
  24845. static="false" final="false" visibility="public"
  24846. deprecated="not deprecated">
  24847. </method>
  24848. <method name="getGroupingComparator" return="org.apache.hadoop.io.RawComparator"
  24849. abstract="false" native="false" synchronized="false"
  24850. static="false" final="false" visibility="public"
  24851. deprecated="not deprecated">
  24852. </method>
  24853. <method name="getInputFormatClass" return="java.lang.Class"
  24854. abstract="false" native="false" synchronized="false"
  24855. static="false" final="false" visibility="public"
  24856. deprecated="not deprecated">
  24857. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  24858. </method>
  24859. <method name="getJar" return="java.lang.String"
  24860. abstract="false" native="false" synchronized="false"
  24861. static="false" final="false" visibility="public"
  24862. deprecated="not deprecated">
  24863. </method>
  24864. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  24865. abstract="false" native="false" synchronized="false"
  24866. static="false" final="false" visibility="public"
  24867. deprecated="not deprecated">
  24868. </method>
  24869. <method name="getJobName" return="java.lang.String"
  24870. abstract="false" native="false" synchronized="false"
  24871. static="false" final="false" visibility="public"
  24872. deprecated="not deprecated">
  24873. </method>
  24874. <method name="getJobSetupCleanupNeeded" return="boolean"
  24875. abstract="false" native="false" synchronized="false"
  24876. static="false" final="false" visibility="public"
  24877. deprecated="not deprecated">
  24878. </method>
  24879. <method name="getLocalCacheArchives" return="org.apache.hadoop.fs.Path[]"
  24880. abstract="false" native="false" synchronized="false"
  24881. static="false" final="false" visibility="public"
  24882. deprecated="not deprecated">
  24883. <exception name="IOException" type="java.io.IOException"/>
  24884. </method>
  24885. <method name="getLocalCacheFiles" return="org.apache.hadoop.fs.Path[]"
  24886. abstract="false" native="false" synchronized="false"
  24887. static="false" final="false" visibility="public"
  24888. deprecated="not deprecated">
  24889. <exception name="IOException" type="java.io.IOException"/>
  24890. </method>
  24891. <method name="getMapOutputKeyClass" return="java.lang.Class"
  24892. abstract="false" native="false" synchronized="false"
  24893. static="false" final="false" visibility="public"
  24894. deprecated="not deprecated">
  24895. </method>
  24896. <method name="getMapOutputValueClass" return="java.lang.Class"
  24897. abstract="false" native="false" synchronized="false"
  24898. static="false" final="false" visibility="public"
  24899. deprecated="not deprecated">
  24900. </method>
  24901. <method name="getMapperClass" return="java.lang.Class"
  24902. abstract="false" native="false" synchronized="false"
  24903. static="false" final="false" visibility="public"
  24904. deprecated="not deprecated">
  24905. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  24906. </method>
  24907. <method name="getMaxMapAttempts" return="int"
  24908. abstract="false" native="false" synchronized="false"
  24909. static="false" final="false" visibility="public"
  24910. deprecated="not deprecated">
  24911. </method>
  24912. <method name="getMaxReduceAttempts" return="int"
  24913. abstract="false" native="false" synchronized="false"
  24914. static="false" final="false" visibility="public"
  24915. deprecated="not deprecated">
  24916. </method>
  24917. <method name="getNumReduceTasks" return="int"
  24918. abstract="false" native="false" synchronized="false"
  24919. static="false" final="false" visibility="public"
  24920. deprecated="not deprecated">
  24921. </method>
  24922. <method name="getOutputFormatClass" return="java.lang.Class"
  24923. abstract="false" native="false" synchronized="false"
  24924. static="false" final="false" visibility="public"
  24925. deprecated="not deprecated">
  24926. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  24927. </method>
  24928. <method name="getOutputKeyClass" return="java.lang.Class"
  24929. abstract="false" native="false" synchronized="false"
  24930. static="false" final="false" visibility="public"
  24931. deprecated="not deprecated">
  24932. </method>
  24933. <method name="getOutputValueClass" return="java.lang.Class"
  24934. abstract="false" native="false" synchronized="false"
  24935. static="false" final="false" visibility="public"
  24936. deprecated="not deprecated">
  24937. </method>
  24938. <method name="getPartitionerClass" return="java.lang.Class"
  24939. abstract="false" native="false" synchronized="false"
  24940. static="false" final="false" visibility="public"
  24941. deprecated="not deprecated">
  24942. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  24943. </method>
  24944. <method name="getReducerClass" return="java.lang.Class"
  24945. abstract="false" native="false" synchronized="false"
  24946. static="false" final="false" visibility="public"
  24947. deprecated="not deprecated">
  24948. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  24949. </method>
  24950. <method name="getSortComparator" return="org.apache.hadoop.io.RawComparator"
  24951. abstract="false" native="false" synchronized="false"
  24952. static="false" final="false" visibility="public"
  24953. deprecated="not deprecated">
  24954. </method>
  24955. <method name="getSymlink" return="boolean"
  24956. abstract="false" native="false" synchronized="false"
  24957. static="false" final="false" visibility="public"
  24958. deprecated="not deprecated">
  24959. </method>
  24960. <method name="getWorkingDirectory" return="org.apache.hadoop.fs.Path"
  24961. abstract="false" native="false" synchronized="false"
  24962. static="false" final="false" visibility="public"
  24963. deprecated="not deprecated">
  24964. <exception name="IOException" type="java.io.IOException"/>
  24965. </method>
  24966. <method name="progress"
  24967. abstract="false" native="false" synchronized="false"
  24968. static="false" final="false" visibility="public"
  24969. deprecated="not deprecated">
  24970. </method>
  24971. <method name="getProfileEnabled" return="boolean"
  24972. abstract="false" native="false" synchronized="false"
  24973. static="false" final="false" visibility="public"
  24974. deprecated="not deprecated">
  24975. </method>
  24976. <method name="getProfileParams" return="java.lang.String"
  24977. abstract="false" native="false" synchronized="false"
  24978. static="false" final="false" visibility="public"
  24979. deprecated="not deprecated">
  24980. </method>
  24981. <method name="getProfileTaskRange" return="org.apache.hadoop.conf.Configuration.IntegerRanges"
  24982. abstract="false" native="false" synchronized="false"
  24983. static="false" final="false" visibility="public"
  24984. deprecated="not deprecated">
  24985. <param name="isMap" type="boolean"/>
  24986. </method>
  24987. <method name="getUser" return="java.lang.String"
  24988. abstract="false" native="false" synchronized="false"
  24989. static="false" final="false" visibility="public"
  24990. deprecated="not deprecated">
  24991. </method>
  24992. <method name="getCredentials" return="org.apache.hadoop.security.Credentials"
  24993. abstract="false" native="false" synchronized="false"
  24994. static="false" final="false" visibility="public"
  24995. deprecated="not deprecated">
  24996. </method>
  24997. <field name="mapContext" type="org.apache.hadoop.mapreduce.MapContext"
  24998. transient="false" volatile="false"
  24999. static="false" final="false" visibility="protected"
  25000. deprecated="not deprecated">
  25001. </field>
  25002. </class>
  25003. <!-- end class org.apache.hadoop.mapreduce.lib.map.WrappedMapper.Context -->
  25004. </package>
  25005. <package name="org.apache.hadoop.mapreduce.lib.output">
  25006. <!-- start class org.apache.hadoop.mapreduce.lib.output.FileOutputCommitter -->
  25007. <class name="FileOutputCommitter" extends="org.apache.hadoop.mapreduce.OutputCommitter"
  25008. abstract="false"
  25009. static="false" final="false" visibility="public"
  25010. deprecated="not deprecated">
  25011. <constructor name="FileOutputCommitter" type="org.apache.hadoop.fs.Path, org.apache.hadoop.mapreduce.TaskAttemptContext"
  25012. static="false" final="false" visibility="public"
  25013. deprecated="not deprecated">
  25014. <exception name="IOException" type="java.io.IOException"/>
  25015. <doc>
  25016. <![CDATA[Create a file output committer
  25017. @param outputPath the job's output path
  25018. @param context the task's context
  25019. @throws IOException]]>
  25020. </doc>
  25021. </constructor>
  25022. <method name="setupJob"
  25023. abstract="false" native="false" synchronized="false"
  25024. static="false" final="false" visibility="public"
  25025. deprecated="not deprecated">
  25026. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25027. <exception name="IOException" type="java.io.IOException"/>
  25028. <doc>
  25029. <![CDATA[Create the temporary directory that is the root of all of the task
  25030. work directories.
  25031. @param context the job's context]]>
  25032. </doc>
  25033. </method>
  25034. <method name="commitJob"
  25035. abstract="false" native="false" synchronized="false"
  25036. static="false" final="false" visibility="public"
  25037. deprecated="not deprecated">
  25038. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25039. <exception name="IOException" type="java.io.IOException"/>
  25040. <doc>
  25041. <![CDATA[Delete the temporary directory, including all of the work directories.
  25042. Create a _SUCCESS file to mark it as successful.
  25043. @param context the job's context]]>
  25044. </doc>
  25045. </method>
  25046. <method name="cleanupJob"
  25047. abstract="false" native="false" synchronized="false"
  25048. static="false" final="false" visibility="public"
  25049. deprecated="not deprecated">
  25050. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25051. <exception name="IOException" type="java.io.IOException"/>
  25052. </method>
  25053. <method name="abortJob"
  25054. abstract="false" native="false" synchronized="false"
  25055. static="false" final="false" visibility="public"
  25056. deprecated="not deprecated">
  25057. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25058. <param name="state" type="org.apache.hadoop.mapreduce.JobStatus.State"/>
  25059. <exception name="IOException" type="java.io.IOException"/>
  25060. <doc>
  25061. <![CDATA[Delete the temporary directory, including all of the work directories.
  25062. @param context the job's context]]>
  25063. </doc>
  25064. </method>
  25065. <method name="setupTask"
  25066. abstract="false" native="false" synchronized="false"
  25067. static="false" final="false" visibility="public"
  25068. deprecated="not deprecated">
  25069. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25070. <exception name="IOException" type="java.io.IOException"/>
  25071. <doc>
  25072. <![CDATA[No task setup required.]]>
  25073. </doc>
  25074. </method>
  25075. <method name="commitTask"
  25076. abstract="false" native="false" synchronized="false"
  25077. static="false" final="false" visibility="public"
  25078. deprecated="not deprecated">
  25079. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25080. <exception name="IOException" type="java.io.IOException"/>
  25081. <doc>
  25082. <![CDATA[Move the files from the work directory to the job output directory
  25083. @param context the task context]]>
  25084. </doc>
  25085. </method>
  25086. <method name="abortTask"
  25087. abstract="false" native="false" synchronized="false"
  25088. static="false" final="false" visibility="public"
  25089. deprecated="not deprecated">
  25090. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25091. <exception name="IOException" type="java.io.IOException"/>
  25092. <doc>
  25093. <![CDATA[Delete the work directory
  25094. @throws IOException]]>
  25095. </doc>
  25096. </method>
  25097. <method name="needsTaskCommit" return="boolean"
  25098. abstract="false" native="false" synchronized="false"
  25099. static="false" final="false" visibility="public"
  25100. deprecated="not deprecated">
  25101. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25102. <exception name="IOException" type="java.io.IOException"/>
  25103. <doc>
  25104. <![CDATA[Did this task write any files in the work directory?
  25105. @param context the task's context]]>
  25106. </doc>
  25107. </method>
  25108. <method name="getWorkPath" return="org.apache.hadoop.fs.Path"
  25109. abstract="false" native="false" synchronized="false"
  25110. static="false" final="false" visibility="public"
  25111. deprecated="not deprecated">
  25112. <exception name="IOException" type="java.io.IOException"/>
  25113. <doc>
  25114. <![CDATA[Get the directory that the task should write results into
  25115. @return the work directory
  25116. @throws IOException]]>
  25117. </doc>
  25118. </method>
  25119. <field name="TEMP_DIR_NAME" type="java.lang.String"
  25120. transient="false" volatile="false"
  25121. static="true" final="true" visibility="protected"
  25122. deprecated="not deprecated">
  25123. <doc>
  25124. <![CDATA[Temporary directory name]]>
  25125. </doc>
  25126. </field>
  25127. <field name="SUCCEEDED_FILE_NAME" type="java.lang.String"
  25128. transient="false" volatile="false"
  25129. static="true" final="true" visibility="public"
  25130. deprecated="not deprecated">
  25131. </field>
  25132. <doc>
  25133. <![CDATA[An {@link OutputCommitter} that commits files specified
  25134. in job output directory i.e. ${mapreduce.output.fileoutputformat.outputdir}.]]>
  25135. </doc>
  25136. </class>
  25137. <!-- end class org.apache.hadoop.mapreduce.lib.output.FileOutputCommitter -->
  25138. <!-- start class org.apache.hadoop.mapreduce.lib.output.FileOutputFormat -->
  25139. <class name="FileOutputFormat" extends="org.apache.hadoop.mapreduce.OutputFormat"
  25140. abstract="true"
  25141. static="false" final="false" visibility="public"
  25142. deprecated="not deprecated">
  25143. <constructor name="FileOutputFormat"
  25144. static="false" final="false" visibility="public"
  25145. deprecated="not deprecated">
  25146. </constructor>
  25147. <method name="setCompressOutput"
  25148. abstract="false" native="false" synchronized="false"
  25149. static="true" final="false" visibility="public"
  25150. deprecated="not deprecated">
  25151. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25152. <param name="compress" type="boolean"/>
  25153. <doc>
  25154. <![CDATA[Set whether the output of the job is compressed.
  25155. @param job the job to modify
  25156. @param compress should the output of the job be compressed?]]>
  25157. </doc>
  25158. </method>
  25159. <method name="getCompressOutput" return="boolean"
  25160. abstract="false" native="false" synchronized="false"
  25161. static="true" final="false" visibility="public"
  25162. deprecated="not deprecated">
  25163. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25164. <doc>
  25165. <![CDATA[Is the job output compressed?
  25166. @param job the Job to look in
  25167. @return <code>true</code> if the job output should be compressed,
  25168. <code>false</code> otherwise]]>
  25169. </doc>
  25170. </method>
  25171. <method name="setOutputCompressorClass"
  25172. abstract="false" native="false" synchronized="false"
  25173. static="true" final="false" visibility="public"
  25174. deprecated="not deprecated">
  25175. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25176. <param name="codecClass" type="java.lang.Class"/>
  25177. <doc>
  25178. <![CDATA[Set the {@link CompressionCodec} to be used to compress job outputs.
  25179. @param job the job to modify
  25180. @param codecClass the {@link CompressionCodec} to be used to
  25181. compress the job outputs]]>
  25182. </doc>
  25183. </method>
  25184. <method name="getOutputCompressorClass" return="java.lang.Class"
  25185. abstract="false" native="false" synchronized="false"
  25186. static="true" final="false" visibility="public"
  25187. deprecated="not deprecated">
  25188. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25189. <param name="defaultValue" type="java.lang.Class"/>
  25190. <doc>
  25191. <![CDATA[Get the {@link CompressionCodec} for compressing the job outputs.
  25192. @param job the {@link Job} to look in
  25193. @param defaultValue the {@link CompressionCodec} to return if not set
  25194. @return the {@link CompressionCodec} to be used to compress the
  25195. job outputs
  25196. @throws IllegalArgumentException if the class was specified, but not found]]>
  25197. </doc>
  25198. </method>
  25199. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25200. abstract="true" native="false" synchronized="false"
  25201. static="false" final="false" visibility="public"
  25202. deprecated="not deprecated">
  25203. <param name="job" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25204. <exception name="IOException" type="java.io.IOException"/>
  25205. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25206. </method>
  25207. <method name="checkOutputSpecs"
  25208. abstract="false" native="false" synchronized="false"
  25209. static="false" final="false" visibility="public"
  25210. deprecated="not deprecated">
  25211. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25212. <exception name="FileAlreadyExistsException" type="org.apache.hadoop.fs.FileAlreadyExistsException"/>
  25213. <exception name="IOException" type="java.io.IOException"/>
  25214. </method>
  25215. <method name="setOutputPath"
  25216. abstract="false" native="false" synchronized="false"
  25217. static="true" final="false" visibility="public"
  25218. deprecated="not deprecated">
  25219. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25220. <param name="outputDir" type="org.apache.hadoop.fs.Path"/>
  25221. <doc>
  25222. <![CDATA[Set the {@link Path} of the output directory for the map-reduce job.
  25223. @param job The job to modify
  25224. @param outputDir the {@link Path} of the output directory for
  25225. the map-reduce job.]]>
  25226. </doc>
  25227. </method>
  25228. <method name="getOutputPath" return="org.apache.hadoop.fs.Path"
  25229. abstract="false" native="false" synchronized="false"
  25230. static="true" final="false" visibility="public"
  25231. deprecated="not deprecated">
  25232. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25233. <doc>
  25234. <![CDATA[Get the {@link Path} to the output directory for the map-reduce job.
  25235. @return the {@link Path} to the output directory for the map-reduce job.
  25236. @see FileOutputFormat#getWorkOutputPath(TaskInputOutputContext)]]>
  25237. </doc>
  25238. </method>
  25239. <method name="getWorkOutputPath" return="org.apache.hadoop.fs.Path"
  25240. abstract="false" native="false" synchronized="false"
  25241. static="true" final="false" visibility="public"
  25242. deprecated="not deprecated">
  25243. <param name="context" type="org.apache.hadoop.mapreduce.TaskInputOutputContext"/>
  25244. <exception name="IOException" type="java.io.IOException"/>
  25245. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25246. <doc>
  25247. <![CDATA[Get the {@link Path} to the task's temporary output directory
  25248. for the map-reduce job
  25249. <h4 id="SideEffectFiles">Tasks' Side-Effect Files</h4>
  25250. <p>Some applications need to create/write-to side-files, which differ from
  25251. the actual job-outputs.</p>
  25252. <p>In such cases there could be issues with 2 instances of the same TIP
  25253. (running simultaneously e.g. speculative tasks) trying to open/write-to the
  25254. same file (path) on HDFS. Hence the application-writer will have to pick
  25255. unique names per task-attempt (e.g. using the attemptid, say
  25256. <tt>attempt_200709221812_0001_m_000000_0</tt>), not just per TIP.</p>
  25257. <p>To get around this the Map-Reduce framework helps the application-writer
  25258. out by maintaining a special
  25259. <tt>${mapreduce.output.fileoutputformat.outputdir}/_temporary/_${taskid}</tt>
  25260. sub-directory for each task-attempt on HDFS where the output of the
  25261. task-attempt goes. On successful completion of the task-attempt the files
  25262. in the <tt>${mapreduce.output.fileoutputformat.outputdir}/_temporary/_${taskid}</tt> (only)
  25263. are <i>promoted</i> to <tt>${mapreduce.output.fileoutputformat.outputdir}</tt>. Of course, the
  25264. framework discards the sub-directory of unsuccessful task-attempts. This
  25265. is completely transparent to the application.</p>
  25266. <p>The application-writer can take advantage of this by creating any
  25267. side-files required in a work directory during execution
  25268. of the task i.e. via
  25269. {@link #getWorkOutputPath(TaskInputOutputContext)}, and
  25270. the framework will move them out similarly - thus there is no need to pick
  25271. unique paths per task-attempt.</p>
  25272. <p>The entire discussion holds true for maps of jobs with
  25273. reducer=NONE (i.e. 0 reduces) since output of the map, in that case,
  25274. goes directly to HDFS.</p>
  25275. @return the {@link Path} to the task's temporary output directory
  25276. for the map-reduce job.]]>
  25277. </doc>
  25278. </method>
  25279. <method name="getPathForWorkFile" return="org.apache.hadoop.fs.Path"
  25280. abstract="false" native="false" synchronized="false"
  25281. static="true" final="false" visibility="public"
  25282. deprecated="not deprecated">
  25283. <param name="context" type="org.apache.hadoop.mapreduce.TaskInputOutputContext"/>
  25284. <param name="name" type="java.lang.String"/>
  25285. <param name="extension" type="java.lang.String"/>
  25286. <exception name="IOException" type="java.io.IOException"/>
  25287. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25288. <doc>
  25289. <![CDATA[Helper function to generate a {@link Path} for a file that is unique for
  25290. the task within the job output directory.
  25291. <p>The path can be used to create custom files from within the map and
  25292. reduce tasks. The path name will be unique for each task. The path parent
  25293. will be the job output directory.</p>
  25294. <p>This method uses the {@link #getUniqueFile} method to make the file name
  25295. unique for the task.</p>
  25296. @param context the context for the task.
  25297. @param name the name for the file.
  25298. @param extension the extension for the file
  25299. @return a unique path across all tasks of the job.]]>
  25300. </doc>
  25301. </method>
  25302. <method name="getUniqueFile" return="java.lang.String"
  25303. abstract="false" native="false" synchronized="true"
  25304. static="true" final="false" visibility="public"
  25305. deprecated="not deprecated">
  25306. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25307. <param name="name" type="java.lang.String"/>
  25308. <param name="extension" type="java.lang.String"/>
  25309. <doc>
  25310. <![CDATA[Generate a unique filename, based on the task id, name, and extension
  25311. @param context the task that is calling this
  25312. @param name the base filename
  25313. @param extension the filename extension
  25314. @return a string like $name-[mrsct]-$id$extension]]>
  25315. </doc>
  25316. </method>
  25317. <method name="getDefaultWorkFile" return="org.apache.hadoop.fs.Path"
  25318. abstract="false" native="false" synchronized="false"
  25319. static="false" final="false" visibility="public"
  25320. deprecated="not deprecated">
  25321. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25322. <param name="extension" type="java.lang.String"/>
  25323. <exception name="IOException" type="java.io.IOException"/>
  25324. <doc>
  25325. <![CDATA[Get the default path and filename for the output format.
  25326. @param context the task context
  25327. @param extension an extension to add to the filename
  25328. @return a full path $output/_temporary/$taskid/part-[mr]-$id
  25329. @throws IOException]]>
  25330. </doc>
  25331. </method>
  25332. <method name="getOutputName" return="java.lang.String"
  25333. abstract="false" native="false" synchronized="false"
  25334. static="true" final="false" visibility="protected"
  25335. deprecated="not deprecated">
  25336. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25337. <doc>
  25338. <![CDATA[Get the base output name for the output file.]]>
  25339. </doc>
  25340. </method>
  25341. <method name="setOutputName"
  25342. abstract="false" native="false" synchronized="false"
  25343. static="true" final="false" visibility="protected"
  25344. deprecated="not deprecated">
  25345. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25346. <param name="name" type="java.lang.String"/>
  25347. <doc>
  25348. <![CDATA[Set the base output name for output file to be created.]]>
  25349. </doc>
  25350. </method>
  25351. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  25352. abstract="false" native="false" synchronized="true"
  25353. static="false" final="false" visibility="public"
  25354. deprecated="not deprecated">
  25355. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25356. <exception name="IOException" type="java.io.IOException"/>
  25357. </method>
  25358. <field name="BASE_OUTPUT_NAME" type="java.lang.String"
  25359. transient="false" volatile="false"
  25360. static="true" final="true" visibility="protected"
  25361. deprecated="not deprecated">
  25362. </field>
  25363. <field name="PART" type="java.lang.String"
  25364. transient="false" volatile="false"
  25365. static="true" final="true" visibility="protected"
  25366. deprecated="not deprecated">
  25367. </field>
  25368. <field name="COMPRESS" type="java.lang.String"
  25369. transient="false" volatile="false"
  25370. static="true" final="true" visibility="public"
  25371. deprecated="not deprecated">
  25372. </field>
  25373. <field name="COMPRESS_CODEC" type="java.lang.String"
  25374. transient="false" volatile="false"
  25375. static="true" final="true" visibility="public"
  25376. deprecated="not deprecated">
  25377. </field>
  25378. <field name="COMPRESS_TYPE" type="java.lang.String"
  25379. transient="false" volatile="false"
  25380. static="true" final="true" visibility="public"
  25381. deprecated="not deprecated">
  25382. </field>
  25383. <field name="OUTDIR" type="java.lang.String"
  25384. transient="false" volatile="false"
  25385. static="true" final="true" visibility="public"
  25386. deprecated="not deprecated">
  25387. </field>
  25388. <doc>
  25389. <![CDATA[A base class for {@link OutputFormat}s that write to {@link FileSystem}s.]]>
  25390. </doc>
  25391. </class>
  25392. <!-- end class org.apache.hadoop.mapreduce.lib.output.FileOutputFormat -->
  25393. <!-- start class org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat -->
  25394. <class name="FilterOutputFormat" extends="org.apache.hadoop.mapreduce.OutputFormat"
  25395. abstract="false"
  25396. static="false" final="false" visibility="public"
  25397. deprecated="not deprecated">
  25398. <constructor name="FilterOutputFormat"
  25399. static="false" final="false" visibility="public"
  25400. deprecated="not deprecated">
  25401. </constructor>
  25402. <constructor name="FilterOutputFormat" type="org.apache.hadoop.mapreduce.OutputFormat"
  25403. static="false" final="false" visibility="public"
  25404. deprecated="not deprecated">
  25405. <doc>
  25406. <![CDATA[Create a FilterOutputFormat based on the underlying output format.
  25407. @param baseOut the underlying OutputFormat]]>
  25408. </doc>
  25409. </constructor>
  25410. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25411. abstract="false" native="false" synchronized="false"
  25412. static="false" final="false" visibility="public"
  25413. deprecated="not deprecated">
  25414. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25415. <exception name="IOException" type="java.io.IOException"/>
  25416. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25417. </method>
  25418. <method name="checkOutputSpecs"
  25419. abstract="false" native="false" synchronized="false"
  25420. static="false" final="false" visibility="public"
  25421. deprecated="not deprecated">
  25422. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25423. <exception name="IOException" type="java.io.IOException"/>
  25424. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25425. </method>
  25426. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  25427. abstract="false" native="false" synchronized="false"
  25428. static="false" final="false" visibility="public"
  25429. deprecated="not deprecated">
  25430. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25431. <exception name="IOException" type="java.io.IOException"/>
  25432. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25433. </method>
  25434. <field name="baseOut" type="org.apache.hadoop.mapreduce.OutputFormat"
  25435. transient="false" volatile="false"
  25436. static="false" final="false" visibility="protected"
  25437. deprecated="not deprecated">
  25438. </field>
  25439. <doc>
  25440. <![CDATA[FilterOutputFormat is a convenience class that wraps OutputFormat.]]>
  25441. </doc>
  25442. </class>
  25443. <!-- end class org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat -->
  25444. <!-- start class org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat.FilterRecordWriter -->
  25445. <class name="FilterOutputFormat.FilterRecordWriter" extends="org.apache.hadoop.mapreduce.RecordWriter"
  25446. abstract="false"
  25447. static="true" final="false" visibility="public"
  25448. deprecated="not deprecated">
  25449. <constructor name="FilterOutputFormat.FilterRecordWriter"
  25450. static="false" final="false" visibility="public"
  25451. deprecated="not deprecated">
  25452. </constructor>
  25453. <constructor name="FilterOutputFormat.FilterRecordWriter" type="org.apache.hadoop.mapreduce.RecordWriter"
  25454. static="false" final="false" visibility="public"
  25455. deprecated="not deprecated">
  25456. </constructor>
  25457. <method name="write"
  25458. abstract="false" native="false" synchronized="false"
  25459. static="false" final="false" visibility="public"
  25460. deprecated="not deprecated">
  25461. <param name="key" type="K"/>
  25462. <param name="value" type="V"/>
  25463. <exception name="IOException" type="java.io.IOException"/>
  25464. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25465. </method>
  25466. <method name="close"
  25467. abstract="false" native="false" synchronized="false"
  25468. static="false" final="false" visibility="public"
  25469. deprecated="not deprecated">
  25470. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25471. <exception name="IOException" type="java.io.IOException"/>
  25472. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25473. </method>
  25474. <field name="rawWriter" type="org.apache.hadoop.mapreduce.RecordWriter"
  25475. transient="false" volatile="false"
  25476. static="false" final="false" visibility="protected"
  25477. deprecated="not deprecated">
  25478. </field>
  25479. <doc>
  25480. <![CDATA[<code>FilterRecordWriter</code> is a convenience wrapper
  25481. class that extends the {@link RecordWriter}.]]>
  25482. </doc>
  25483. </class>
  25484. <!-- end class org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat.FilterRecordWriter -->
  25485. <!-- start class org.apache.hadoop.mapreduce.lib.output.LazyOutputFormat -->
  25486. <class name="LazyOutputFormat" extends="org.apache.hadoop.mapreduce.lib.output.FilterOutputFormat"
  25487. abstract="false"
  25488. static="false" final="false" visibility="public"
  25489. deprecated="not deprecated">
  25490. <constructor name="LazyOutputFormat"
  25491. static="false" final="false" visibility="public"
  25492. deprecated="not deprecated">
  25493. </constructor>
  25494. <method name="setOutputFormatClass"
  25495. abstract="false" native="false" synchronized="false"
  25496. static="true" final="false" visibility="public"
  25497. deprecated="not deprecated">
  25498. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25499. <param name="theClass" type="java.lang.Class"/>
  25500. <doc>
  25501. <![CDATA[Set the underlying output format for LazyOutputFormat.
  25502. @param job the {@link Job} to modify
  25503. @param theClass the underlying class]]>
  25504. </doc>
  25505. </method>
  25506. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25507. abstract="false" native="false" synchronized="false"
  25508. static="false" final="false" visibility="public"
  25509. deprecated="not deprecated">
  25510. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25511. <exception name="IOException" type="java.io.IOException"/>
  25512. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25513. </method>
  25514. <method name="checkOutputSpecs"
  25515. abstract="false" native="false" synchronized="false"
  25516. static="false" final="false" visibility="public"
  25517. deprecated="not deprecated">
  25518. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25519. <exception name="IOException" type="java.io.IOException"/>
  25520. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25521. </method>
  25522. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  25523. abstract="false" native="false" synchronized="false"
  25524. static="false" final="false" visibility="public"
  25525. deprecated="not deprecated">
  25526. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25527. <exception name="IOException" type="java.io.IOException"/>
  25528. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25529. </method>
  25530. <field name="OUTPUT_FORMAT" type="java.lang.String"
  25531. transient="false" volatile="false"
  25532. static="true" final="false" visibility="public"
  25533. deprecated="not deprecated">
  25534. </field>
  25535. <doc>
  25536. <![CDATA[A Convenience class that creates output lazily.]]>
  25537. </doc>
  25538. </class>
  25539. <!-- end class org.apache.hadoop.mapreduce.lib.output.LazyOutputFormat -->
  25540. <!-- start class org.apache.hadoop.mapreduce.lib.output.MapFileOutputFormat -->
  25541. <class name="MapFileOutputFormat" extends="org.apache.hadoop.mapreduce.lib.output.FileOutputFormat"
  25542. abstract="false"
  25543. static="false" final="false" visibility="public"
  25544. deprecated="not deprecated">
  25545. <constructor name="MapFileOutputFormat"
  25546. static="false" final="false" visibility="public"
  25547. deprecated="not deprecated">
  25548. </constructor>
  25549. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25550. abstract="false" native="false" synchronized="false"
  25551. static="false" final="false" visibility="public"
  25552. deprecated="not deprecated">
  25553. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25554. <exception name="IOException" type="java.io.IOException"/>
  25555. </method>
  25556. <method name="getReaders" return="org.apache.hadoop.io.MapFile.Reader[]"
  25557. abstract="false" native="false" synchronized="false"
  25558. static="true" final="false" visibility="public"
  25559. deprecated="not deprecated">
  25560. <param name="dir" type="org.apache.hadoop.fs.Path"/>
  25561. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  25562. <exception name="IOException" type="java.io.IOException"/>
  25563. <doc>
  25564. <![CDATA[Open the output generated by this format.]]>
  25565. </doc>
  25566. </method>
  25567. <method name="getEntry" return="org.apache.hadoop.io.Writable"
  25568. abstract="false" native="false" synchronized="false"
  25569. static="true" final="false" visibility="public"
  25570. deprecated="not deprecated">
  25571. <param name="readers" type="org.apache.hadoop.io.MapFile.Reader[]"/>
  25572. <param name="partitioner" type="org.apache.hadoop.mapreduce.Partitioner"/>
  25573. <param name="key" type="K"/>
  25574. <param name="value" type="V"/>
  25575. <exception name="IOException" type="java.io.IOException"/>
  25576. <doc>
  25577. <![CDATA[Get an entry from output generated by this class.]]>
  25578. </doc>
  25579. </method>
  25580. <doc>
  25581. <![CDATA[An {@link org.apache.hadoop.mapreduce.OutputFormat} that writes
  25582. {@link MapFile}s.]]>
  25583. </doc>
  25584. </class>
  25585. <!-- end class org.apache.hadoop.mapreduce.lib.output.MapFileOutputFormat -->
  25586. <!-- start class org.apache.hadoop.mapreduce.lib.output.MultipleOutputs -->
  25587. <class name="MultipleOutputs" extends="java.lang.Object"
  25588. abstract="false"
  25589. static="false" final="false" visibility="public"
  25590. deprecated="not deprecated">
  25591. <constructor name="MultipleOutputs" type="org.apache.hadoop.mapreduce.TaskInputOutputContext"
  25592. static="false" final="false" visibility="public"
  25593. deprecated="not deprecated">
  25594. <doc>
  25595. <![CDATA[Creates and initializes multiple outputs support,
  25596. it should be instantiated in the Mapper/Reducer setup method.
  25597. @param context the TaskInputOutputContext object]]>
  25598. </doc>
  25599. </constructor>
  25600. <method name="addNamedOutput"
  25601. abstract="false" native="false" synchronized="false"
  25602. static="true" final="false" visibility="public"
  25603. deprecated="not deprecated">
  25604. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25605. <param name="namedOutput" type="java.lang.String"/>
  25606. <param name="outputFormatClass" type="java.lang.Class"/>
  25607. <param name="keyClass" type="java.lang.Class"/>
  25608. <param name="valueClass" type="java.lang.Class"/>
  25609. <doc>
  25610. <![CDATA[Adds a named output for the job.
  25611. <p/>
  25612. @param job job to add the named output
  25613. @param namedOutput named output name, it has to be a word, letters
  25614. and numbers only, cannot be the word 'part' as
  25615. that is reserved for the default output.
  25616. @param outputFormatClass OutputFormat class.
  25617. @param keyClass key class
  25618. @param valueClass value class]]>
  25619. </doc>
  25620. </method>
  25621. <method name="setCountersEnabled"
  25622. abstract="false" native="false" synchronized="false"
  25623. static="true" final="false" visibility="public"
  25624. deprecated="not deprecated">
  25625. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25626. <param name="enabled" type="boolean"/>
  25627. <doc>
  25628. <![CDATA[Enables or disables counters for the named outputs.
  25629. The counters group is the {@link MultipleOutputs} class name.
  25630. The names of the counters are the same as the named outputs. These
  25631. counters count the number of records written to each output name.
  25632. By default these counters are disabled.
  25633. @param job job to enable counters
  25634. @param enabled indicates if the counters will be enabled or not.]]>
  25635. </doc>
  25636. </method>
  25637. <method name="getCountersEnabled" return="boolean"
  25638. abstract="false" native="false" synchronized="false"
  25639. static="true" final="false" visibility="public"
  25640. deprecated="not deprecated">
  25641. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25642. <doc>
  25643. <![CDATA[Returns if the counters for the named outputs are enabled or not.
  25644. By default these counters are disabled.
  25645. @param job the job
  25646. @return TRUE if the counters are enabled, FALSE if they are disabled.]]>
  25647. </doc>
  25648. </method>
  25649. <method name="write"
  25650. abstract="false" native="false" synchronized="false"
  25651. static="false" final="false" visibility="public"
  25652. deprecated="not deprecated">
  25653. <param name="namedOutput" type="java.lang.String"/>
  25654. <param name="key" type="K"/>
  25655. <param name="value" type="V"/>
  25656. <exception name="IOException" type="java.io.IOException"/>
  25657. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25658. <doc>
  25659. <![CDATA[Write key and value to the namedOutput.
  25660. Output path is a unique file generated for the namedOutput.
  25661. For example, {namedOutput}-(m|r)-{part-number}
  25662. @param namedOutput the named output name
  25663. @param key the key
  25664. @param value the value]]>
  25665. </doc>
  25666. </method>
  25667. <method name="write"
  25668. abstract="false" native="false" synchronized="false"
  25669. static="false" final="false" visibility="public"
  25670. deprecated="not deprecated">
  25671. <param name="namedOutput" type="java.lang.String"/>
  25672. <param name="key" type="K"/>
  25673. <param name="value" type="V"/>
  25674. <param name="baseOutputPath" type="java.lang.String"/>
  25675. <exception name="IOException" type="java.io.IOException"/>
  25676. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25677. <doc>
  25678. <![CDATA[Write key and value to baseOutputPath using the namedOutput.
  25679. @param namedOutput the named output name
  25680. @param key the key
  25681. @param value the value
  25682. @param baseOutputPath base-output path to write the record to.
  25683. Note: Framework will generate unique filename for the baseOutputPath]]>
  25684. </doc>
  25685. </method>
  25686. <method name="write"
  25687. abstract="false" native="false" synchronized="false"
  25688. static="false" final="false" visibility="public"
  25689. deprecated="not deprecated">
  25690. <param name="key" type="KEYOUT"/>
  25691. <param name="value" type="VALUEOUT"/>
  25692. <param name="baseOutputPath" type="java.lang.String"/>
  25693. <exception name="IOException" type="java.io.IOException"/>
  25694. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25695. <doc>
  25696. <![CDATA[Write key value to an output file name.
  25697. Gets the record writer from job's output format.
  25698. Job's output format should be a FileOutputFormat.
  25699. @param key the key
  25700. @param value the value
  25701. @param baseOutputPath base-output path to write the record to.
  25702. Note: Framework will generate unique filename for the baseOutputPath]]>
  25703. </doc>
  25704. </method>
  25705. <method name="close"
  25706. abstract="false" native="false" synchronized="false"
  25707. static="false" final="false" visibility="public"
  25708. deprecated="not deprecated">
  25709. <exception name="IOException" type="java.io.IOException"/>
  25710. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25711. <doc>
  25712. <![CDATA[Closes all the opened outputs.
  25713. This should be called from cleanup method of map/reduce task.
  25714. If overridden subclasses must invoke <code>super.close()</code> at the
  25715. end of their <code>close()</code>]]>
  25716. </doc>
  25717. </method>
  25718. <doc>
  25719. <![CDATA[The MultipleOutputs class simplifies writing output data
  25720. to multiple outputs
  25721. <p>
  25722. Case one: writing to additional outputs other than the job default output.
  25723. Each additional output, or named output, may be configured with its own
  25724. <code>OutputFormat</code>, with its own key class and with its own value
  25725. class.
  25726. <p>
  25727. Case two: to write data to different files provided by user
  25728. </p>
  25729. <p>
  25730. MultipleOutputs supports counters, by default they are disabled. The
  25731. counters group is the {@link MultipleOutputs} class name. The names of the
  25732. counters are the same as the output name. These count the number of records
  25733. written to each output name.
  25734. </p>
  25735. Usage pattern for job submission:
  25736. <pre>
  25737. Job job = new Job();
  25738. FileInputFormat.setInputPath(job, inDir);
  25739. FileOutputFormat.setOutputPath(job, outDir);
  25740. job.setMapperClass(MOMap.class);
  25741. job.setReducerClass(MOReduce.class);
  25742. ...
  25743. // Defines additional single text based output 'text' for the job
  25744. MultipleOutputs.addNamedOutput(job, "text", TextOutputFormat.class,
  25745. LongWritable.class, Text.class);
  25746. // Defines additional sequence-file based output 'sequence' for the job
  25747. MultipleOutputs.addNamedOutput(job, "seq",
  25748. SequenceFileOutputFormat.class,
  25749. LongWritable.class, Text.class);
  25750. ...
  25751. job.waitForCompletion(true);
  25752. ...
  25753. </pre>
  25754. <p>
  25755. Usage in Reducer:
  25756. <pre>
  25757. &lt;K, V&gt; String generateFileName(K k, V v) {
  25758. return k.toString() + "_" + v.toString();
  25759. }
  25760. public class MOReduce extends
  25761. Reducer&lt;WritableComparable, Writable,WritableComparable, Writable&gt; {
  25762. private MultipleOutputs mos;
  25763. public void setup(Context context) {
  25764. ...
  25765. mos = new MultipleOutputs(context);
  25766. }
  25767. public void reduce(WritableComparable key, Iterator&lt;Writable&gt; values,
  25768. Context context)
  25769. throws IOException {
  25770. ...
  25771. mos.write("text", key, new Text("Hello"));
  25772. mos.write("seq", new LongWritable(1), new Text("Bye"), "seq_a");
  25773. mos.write("seq", new LongWritable(2), new Text("Chau"), "seq_b");
  25774. mos.write(key, new Text("value"), generateFileName(key, new Text("value")));
  25775. ...
  25776. }
  25777. public void cleanup(Context context) throws IOException {
  25778. mos.close();
  25779. ...
  25780. }
  25781. }
  25782. </pre>]]>
  25783. </doc>
  25784. </class>
  25785. <!-- end class org.apache.hadoop.mapreduce.lib.output.MultipleOutputs -->
  25786. <!-- start class org.apache.hadoop.mapreduce.lib.output.NullOutputFormat -->
  25787. <class name="NullOutputFormat" extends="org.apache.hadoop.mapreduce.OutputFormat"
  25788. abstract="false"
  25789. static="false" final="false" visibility="public"
  25790. deprecated="not deprecated">
  25791. <constructor name="NullOutputFormat"
  25792. static="false" final="false" visibility="public"
  25793. deprecated="not deprecated">
  25794. </constructor>
  25795. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25796. abstract="false" native="false" synchronized="false"
  25797. static="false" final="false" visibility="public"
  25798. deprecated="not deprecated">
  25799. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25800. </method>
  25801. <method name="checkOutputSpecs"
  25802. abstract="false" native="false" synchronized="false"
  25803. static="false" final="false" visibility="public"
  25804. deprecated="not deprecated">
  25805. <param name="context" type="org.apache.hadoop.mapreduce.JobContext"/>
  25806. </method>
  25807. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  25808. abstract="false" native="false" synchronized="false"
  25809. static="false" final="false" visibility="public"
  25810. deprecated="not deprecated">
  25811. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25812. </method>
  25813. <doc>
  25814. <![CDATA[Consume all outputs and put them in /dev/null.]]>
  25815. </doc>
  25816. </class>
  25817. <!-- end class org.apache.hadoop.mapreduce.lib.output.NullOutputFormat -->
  25818. <!-- start class org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat -->
  25819. <class name="SequenceFileAsBinaryOutputFormat" extends="org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat"
  25820. abstract="false"
  25821. static="false" final="false" visibility="public"
  25822. deprecated="not deprecated">
  25823. <constructor name="SequenceFileAsBinaryOutputFormat"
  25824. static="false" final="false" visibility="public"
  25825. deprecated="not deprecated">
  25826. </constructor>
  25827. <method name="setSequenceFileOutputKeyClass"
  25828. abstract="false" native="false" synchronized="false"
  25829. static="true" final="false" visibility="public"
  25830. deprecated="not deprecated">
  25831. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25832. <param name="theClass" type="java.lang.Class"/>
  25833. <doc>
  25834. <![CDATA[Set the key class for the {@link SequenceFile}
  25835. <p>This allows the user to specify the key class to be different
  25836. from the actual class ({@link BytesWritable}) used for writing </p>
  25837. @param job the {@link Job} to modify
  25838. @param theClass the SequenceFile output key class.]]>
  25839. </doc>
  25840. </method>
  25841. <method name="setSequenceFileOutputValueClass"
  25842. abstract="false" native="false" synchronized="false"
  25843. static="true" final="false" visibility="public"
  25844. deprecated="not deprecated">
  25845. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25846. <param name="theClass" type="java.lang.Class"/>
  25847. <doc>
  25848. <![CDATA[Set the value class for the {@link SequenceFile}
  25849. <p>This allows the user to specify the value class to be different
  25850. from the actual class ({@link BytesWritable}) used for writing </p>
  25851. @param job the {@link Job} to modify
  25852. @param theClass the SequenceFile output value class.]]>
  25853. </doc>
  25854. </method>
  25855. <method name="getSequenceFileOutputKeyClass" return="java.lang.Class"
  25856. abstract="false" native="false" synchronized="false"
  25857. static="true" final="false" visibility="public"
  25858. deprecated="not deprecated">
  25859. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25860. <doc>
  25861. <![CDATA[Get the key class for the {@link SequenceFile}
  25862. @return the key class of the {@link SequenceFile}]]>
  25863. </doc>
  25864. </method>
  25865. <method name="getSequenceFileOutputValueClass" return="java.lang.Class"
  25866. abstract="false" native="false" synchronized="false"
  25867. static="true" final="false" visibility="public"
  25868. deprecated="not deprecated">
  25869. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25870. <doc>
  25871. <![CDATA[Get the value class for the {@link SequenceFile}
  25872. @return the value class of the {@link SequenceFile}]]>
  25873. </doc>
  25874. </method>
  25875. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25876. abstract="false" native="false" synchronized="false"
  25877. static="false" final="false" visibility="public"
  25878. deprecated="not deprecated">
  25879. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25880. <exception name="IOException" type="java.io.IOException"/>
  25881. </method>
  25882. <method name="checkOutputSpecs"
  25883. abstract="false" native="false" synchronized="false"
  25884. static="false" final="false" visibility="public"
  25885. deprecated="not deprecated">
  25886. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25887. <exception name="IOException" type="java.io.IOException"/>
  25888. </method>
  25889. <field name="KEY_CLASS" type="java.lang.String"
  25890. transient="false" volatile="false"
  25891. static="true" final="false" visibility="public"
  25892. deprecated="not deprecated">
  25893. </field>
  25894. <field name="VALUE_CLASS" type="java.lang.String"
  25895. transient="false" volatile="false"
  25896. static="true" final="false" visibility="public"
  25897. deprecated="not deprecated">
  25898. </field>
  25899. <doc>
  25900. <![CDATA[An {@link org.apache.hadoop.mapreduce.OutputFormat} that writes keys,
  25901. values to {@link SequenceFile}s in binary(raw) format]]>
  25902. </doc>
  25903. </class>
  25904. <!-- end class org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat -->
  25905. <!-- start class org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat.WritableValueBytes -->
  25906. <class name="SequenceFileAsBinaryOutputFormat.WritableValueBytes" extends="java.lang.Object"
  25907. abstract="false"
  25908. static="true" final="false" visibility="public"
  25909. deprecated="not deprecated">
  25910. <implements name="org.apache.hadoop.io.SequenceFile.ValueBytes"/>
  25911. <constructor name="SequenceFileAsBinaryOutputFormat.WritableValueBytes"
  25912. static="false" final="false" visibility="public"
  25913. deprecated="not deprecated">
  25914. </constructor>
  25915. <constructor name="SequenceFileAsBinaryOutputFormat.WritableValueBytes" type="org.apache.hadoop.io.BytesWritable"
  25916. static="false" final="false" visibility="public"
  25917. deprecated="not deprecated">
  25918. </constructor>
  25919. <method name="reset"
  25920. abstract="false" native="false" synchronized="false"
  25921. static="false" final="false" visibility="public"
  25922. deprecated="not deprecated">
  25923. <param name="value" type="org.apache.hadoop.io.BytesWritable"/>
  25924. </method>
  25925. <method name="writeUncompressedBytes"
  25926. abstract="false" native="false" synchronized="false"
  25927. static="false" final="false" visibility="public"
  25928. deprecated="not deprecated">
  25929. <param name="outStream" type="java.io.DataOutputStream"/>
  25930. <exception name="IOException" type="java.io.IOException"/>
  25931. </method>
  25932. <method name="writeCompressedBytes"
  25933. abstract="false" native="false" synchronized="false"
  25934. static="false" final="false" visibility="public"
  25935. deprecated="not deprecated">
  25936. <param name="outStream" type="java.io.DataOutputStream"/>
  25937. <exception name="IllegalArgumentException" type="java.lang.IllegalArgumentException"/>
  25938. <exception name="IOException" type="java.io.IOException"/>
  25939. </method>
  25940. <method name="getSize" return="int"
  25941. abstract="false" native="false" synchronized="false"
  25942. static="false" final="false" visibility="public"
  25943. deprecated="not deprecated">
  25944. </method>
  25945. <doc>
  25946. <![CDATA[Inner class used for appendRaw]]>
  25947. </doc>
  25948. </class>
  25949. <!-- end class org.apache.hadoop.mapreduce.lib.output.SequenceFileAsBinaryOutputFormat.WritableValueBytes -->
  25950. <!-- start class org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat -->
  25951. <class name="SequenceFileOutputFormat" extends="org.apache.hadoop.mapreduce.lib.output.FileOutputFormat"
  25952. abstract="false"
  25953. static="false" final="false" visibility="public"
  25954. deprecated="not deprecated">
  25955. <constructor name="SequenceFileOutputFormat"
  25956. static="false" final="false" visibility="public"
  25957. deprecated="not deprecated">
  25958. </constructor>
  25959. <method name="getSequenceWriter" return="org.apache.hadoop.io.SequenceFile.Writer"
  25960. abstract="false" native="false" synchronized="false"
  25961. static="false" final="false" visibility="protected"
  25962. deprecated="not deprecated">
  25963. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25964. <param name="keyClass" type="java.lang.Class"/>
  25965. <param name="valueClass" type="java.lang.Class"/>
  25966. <exception name="IOException" type="java.io.IOException"/>
  25967. </method>
  25968. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  25969. abstract="false" native="false" synchronized="false"
  25970. static="false" final="false" visibility="public"
  25971. deprecated="not deprecated">
  25972. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  25973. <exception name="IOException" type="java.io.IOException"/>
  25974. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  25975. </method>
  25976. <method name="getOutputCompressionType" return="org.apache.hadoop.io.SequenceFile.CompressionType"
  25977. abstract="false" native="false" synchronized="false"
  25978. static="true" final="false" visibility="public"
  25979. deprecated="not deprecated">
  25980. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  25981. <doc>
  25982. <![CDATA[Get the {@link CompressionType} for the output {@link SequenceFile}.
  25983. @param job the {@link Job}
  25984. @return the {@link CompressionType} for the output {@link SequenceFile},
  25985. defaulting to {@link CompressionType#RECORD}]]>
  25986. </doc>
  25987. </method>
  25988. <method name="setOutputCompressionType"
  25989. abstract="false" native="false" synchronized="false"
  25990. static="true" final="false" visibility="public"
  25991. deprecated="not deprecated">
  25992. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  25993. <param name="style" type="org.apache.hadoop.io.SequenceFile.CompressionType"/>
  25994. <doc>
  25995. <![CDATA[Set the {@link CompressionType} for the output {@link SequenceFile}.
  25996. @param job the {@link Job} to modify
  25997. @param style the {@link CompressionType} for the output
  25998. {@link SequenceFile}]]>
  25999. </doc>
  26000. </method>
  26001. <doc>
  26002. <![CDATA[An {@link OutputFormat} that writes {@link SequenceFile}s.]]>
  26003. </doc>
  26004. </class>
  26005. <!-- end class org.apache.hadoop.mapreduce.lib.output.SequenceFileOutputFormat -->
  26006. <!-- start class org.apache.hadoop.mapreduce.lib.output.TextOutputFormat -->
  26007. <class name="TextOutputFormat" extends="org.apache.hadoop.mapreduce.lib.output.FileOutputFormat"
  26008. abstract="false"
  26009. static="false" final="false" visibility="public"
  26010. deprecated="not deprecated">
  26011. <constructor name="TextOutputFormat"
  26012. static="false" final="false" visibility="public"
  26013. deprecated="not deprecated">
  26014. </constructor>
  26015. <method name="getRecordWriter" return="org.apache.hadoop.mapreduce.RecordWriter"
  26016. abstract="false" native="false" synchronized="false"
  26017. static="false" final="false" visibility="public"
  26018. deprecated="not deprecated">
  26019. <param name="job" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  26020. <exception name="IOException" type="java.io.IOException"/>
  26021. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26022. </method>
  26023. <field name="SEPERATOR" type="java.lang.String"
  26024. transient="false" volatile="false"
  26025. static="true" final="false" visibility="public"
  26026. deprecated="not deprecated">
  26027. </field>
  26028. <doc>
  26029. <![CDATA[An {@link OutputFormat} that writes plain text files.]]>
  26030. </doc>
  26031. </class>
  26032. <!-- end class org.apache.hadoop.mapreduce.lib.output.TextOutputFormat -->
  26033. <!-- start class org.apache.hadoop.mapreduce.lib.output.TextOutputFormat.LineRecordWriter -->
  26034. <class name="TextOutputFormat.LineRecordWriter" extends="org.apache.hadoop.mapreduce.RecordWriter"
  26035. abstract="false"
  26036. static="true" final="false" visibility="protected"
  26037. deprecated="not deprecated">
  26038. <constructor name="TextOutputFormat.LineRecordWriter" type="java.io.DataOutputStream, java.lang.String"
  26039. static="false" final="false" visibility="public"
  26040. deprecated="not deprecated">
  26041. </constructor>
  26042. <constructor name="TextOutputFormat.LineRecordWriter" type="java.io.DataOutputStream"
  26043. static="false" final="false" visibility="public"
  26044. deprecated="not deprecated">
  26045. </constructor>
  26046. <method name="write"
  26047. abstract="false" native="false" synchronized="true"
  26048. static="false" final="false" visibility="public"
  26049. deprecated="not deprecated">
  26050. <param name="key" type="K"/>
  26051. <param name="value" type="V"/>
  26052. <exception name="IOException" type="java.io.IOException"/>
  26053. </method>
  26054. <method name="close"
  26055. abstract="false" native="false" synchronized="true"
  26056. static="false" final="false" visibility="public"
  26057. deprecated="not deprecated">
  26058. <param name="context" type="org.apache.hadoop.mapreduce.TaskAttemptContext"/>
  26059. <exception name="IOException" type="java.io.IOException"/>
  26060. </method>
  26061. <field name="out" type="java.io.DataOutputStream"
  26062. transient="false" volatile="false"
  26063. static="false" final="false" visibility="protected"
  26064. deprecated="not deprecated">
  26065. </field>
  26066. </class>
  26067. <!-- end class org.apache.hadoop.mapreduce.lib.output.TextOutputFormat.LineRecordWriter -->
  26068. </package>
  26069. <package name="org.apache.hadoop.mapreduce.lib.partition">
  26070. <!-- start class org.apache.hadoop.mapreduce.lib.partition.BinaryPartitioner -->
  26071. <class name="BinaryPartitioner" extends="org.apache.hadoop.mapreduce.Partitioner"
  26072. abstract="false"
  26073. static="false" final="false" visibility="public"
  26074. deprecated="not deprecated">
  26075. <implements name="org.apache.hadoop.conf.Configurable"/>
  26076. <constructor name="BinaryPartitioner"
  26077. static="false" final="false" visibility="public"
  26078. deprecated="not deprecated">
  26079. </constructor>
  26080. <method name="setOffsets"
  26081. abstract="false" native="false" synchronized="false"
  26082. static="true" final="false" visibility="public"
  26083. deprecated="not deprecated">
  26084. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26085. <param name="left" type="int"/>
  26086. <param name="right" type="int"/>
  26087. <doc>
  26088. <![CDATA[Set the subarray to be used for partitioning to
  26089. <code>bytes[left:(right+1)]</code> in Python syntax.
  26090. @param conf configuration object
  26091. @param left left Python-style offset
  26092. @param right right Python-style offset]]>
  26093. </doc>
  26094. </method>
  26095. <method name="setLeftOffset"
  26096. abstract="false" native="false" synchronized="false"
  26097. static="true" final="false" visibility="public"
  26098. deprecated="not deprecated">
  26099. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26100. <param name="offset" type="int"/>
  26101. <doc>
  26102. <![CDATA[Set the subarray to be used for partitioning to
  26103. <code>bytes[offset:]</code> in Python syntax.
  26104. @param conf configuration object
  26105. @param offset left Python-style offset]]>
  26106. </doc>
  26107. </method>
  26108. <method name="setRightOffset"
  26109. abstract="false" native="false" synchronized="false"
  26110. static="true" final="false" visibility="public"
  26111. deprecated="not deprecated">
  26112. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26113. <param name="offset" type="int"/>
  26114. <doc>
  26115. <![CDATA[Set the subarray to be used for partitioning to
  26116. <code>bytes[:(offset+1)]</code> in Python syntax.
  26117. @param conf configuration object
  26118. @param offset right Python-style offset]]>
  26119. </doc>
  26120. </method>
  26121. <method name="setConf"
  26122. abstract="false" native="false" synchronized="false"
  26123. static="false" final="false" visibility="public"
  26124. deprecated="not deprecated">
  26125. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26126. </method>
  26127. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  26128. abstract="false" native="false" synchronized="false"
  26129. static="false" final="false" visibility="public"
  26130. deprecated="not deprecated">
  26131. </method>
  26132. <method name="getPartition" return="int"
  26133. abstract="false" native="false" synchronized="false"
  26134. static="false" final="false" visibility="public"
  26135. deprecated="not deprecated">
  26136. <param name="key" type="org.apache.hadoop.io.BinaryComparable"/>
  26137. <param name="value" type="V"/>
  26138. <param name="numPartitions" type="int"/>
  26139. <doc>
  26140. <![CDATA[Use (the specified slice of the array returned by)
  26141. {@link BinaryComparable#getBytes()} to partition.]]>
  26142. </doc>
  26143. </method>
  26144. <field name="LEFT_OFFSET_PROPERTY_NAME" type="java.lang.String"
  26145. transient="false" volatile="false"
  26146. static="true" final="true" visibility="public"
  26147. deprecated="not deprecated">
  26148. </field>
  26149. <field name="RIGHT_OFFSET_PROPERTY_NAME" type="java.lang.String"
  26150. transient="false" volatile="false"
  26151. static="true" final="true" visibility="public"
  26152. deprecated="not deprecated">
  26153. </field>
  26154. <doc>
  26155. <![CDATA[<p>Partition {@link BinaryComparable} keys using a configurable part of
  26156. the bytes array returned by {@link BinaryComparable#getBytes()}.</p>
  26157. <p>The subarray to be used for the partitioning can be defined by means
  26158. of the following properties:
  26159. <ul>
  26160. <li>
  26161. <i>mapreduce.partition.binarypartitioner.left.offset</i>:
  26162. left offset in array (0 by default)
  26163. </li>
  26164. <li>
  26165. <i>mapreduce.partition.binarypartitioner.right.offset</i>:
  26166. right offset in array (-1 by default)
  26167. </li>
  26168. </ul>
  26169. Like in Python, both negative and positive offsets are allowed, but
  26170. the meaning is slightly different. In case of an array of length 5,
  26171. for instance, the possible offsets are:
  26172. <pre><code>
  26173. +---+---+---+---+---+
  26174. | B | B | B | B | B |
  26175. +---+---+---+---+---+
  26176. 0 1 2 3 4
  26177. -5 -4 -3 -2 -1
  26178. </code></pre>
  26179. The first row of numbers gives the position of the offsets 0...4 in
  26180. the array; the second row gives the corresponding negative offsets.
  26181. Contrary to Python, the specified subarray has byte <code>i</code>
  26182. and <code>j</code> as first and last element, respectively, when
  26183. <code>i</code> and <code>j</code> are the left and right offset.
  26184. <p>For Hadoop programs written in Java, it is advisable to use one of
  26185. the following static convenience methods for setting the offsets:
  26186. <ul>
  26187. <li>{@link #setOffsets}</li>
  26188. <li>{@link #setLeftOffset}</li>
  26189. <li>{@link #setRightOffset}</li>
  26190. </ul></p>]]>
  26191. </doc>
  26192. </class>
  26193. <!-- end class org.apache.hadoop.mapreduce.lib.partition.BinaryPartitioner -->
  26194. <!-- start class org.apache.hadoop.mapreduce.lib.partition.HashPartitioner -->
  26195. <class name="HashPartitioner" extends="org.apache.hadoop.mapreduce.Partitioner"
  26196. abstract="false"
  26197. static="false" final="false" visibility="public"
  26198. deprecated="not deprecated">
  26199. <constructor name="HashPartitioner"
  26200. static="false" final="false" visibility="public"
  26201. deprecated="not deprecated">
  26202. </constructor>
  26203. <method name="getPartition" return="int"
  26204. abstract="false" native="false" synchronized="false"
  26205. static="false" final="false" visibility="public"
  26206. deprecated="not deprecated">
  26207. <param name="key" type="K"/>
  26208. <param name="value" type="V"/>
  26209. <param name="numReduceTasks" type="int"/>
  26210. <doc>
  26211. <![CDATA[Use {@link Object#hashCode()} to partition.]]>
  26212. </doc>
  26213. </method>
  26214. <doc>
  26215. <![CDATA[Partition keys by their {@link Object#hashCode()}.]]>
  26216. </doc>
  26217. </class>
  26218. <!-- end class org.apache.hadoop.mapreduce.lib.partition.HashPartitioner -->
  26219. <!-- start class org.apache.hadoop.mapreduce.lib.partition.InputSampler -->
  26220. <class name="InputSampler" extends="org.apache.hadoop.conf.Configured"
  26221. abstract="false"
  26222. static="false" final="false" visibility="public"
  26223. deprecated="not deprecated">
  26224. <implements name="org.apache.hadoop.util.Tool"/>
  26225. <constructor name="InputSampler" type="org.apache.hadoop.conf.Configuration"
  26226. static="false" final="false" visibility="public"
  26227. deprecated="not deprecated">
  26228. </constructor>
  26229. <method name="writePartitionFile"
  26230. abstract="false" native="false" synchronized="false"
  26231. static="true" final="false" visibility="public"
  26232. deprecated="not deprecated">
  26233. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26234. <param name="sampler" type="org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler"/>
  26235. <exception name="IOException" type="java.io.IOException"/>
  26236. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26237. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26238. <doc>
  26239. <![CDATA[Write a partition file for the given job, using the Sampler provided.
  26240. Queries the sampler for a sample keyset, sorts by the output key
  26241. comparator, selects the keys for each rank, and writes to the destination
  26242. returned from {@link TotalOrderPartitioner#getPartitionFile}.]]>
  26243. </doc>
  26244. </method>
  26245. <method name="run" return="int"
  26246. abstract="false" native="false" synchronized="false"
  26247. static="false" final="false" visibility="public"
  26248. deprecated="not deprecated">
  26249. <param name="args" type="java.lang.String[]"/>
  26250. <exception name="Exception" type="java.lang.Exception"/>
  26251. <doc>
  26252. <![CDATA[Driver for InputSampler from the command line.
  26253. Configures a JobConf instance and calls {@link #writePartitionFile}.]]>
  26254. </doc>
  26255. </method>
  26256. <method name="main"
  26257. abstract="false" native="false" synchronized="false"
  26258. static="true" final="false" visibility="public"
  26259. deprecated="not deprecated">
  26260. <param name="args" type="java.lang.String[]"/>
  26261. <exception name="Exception" type="java.lang.Exception"/>
  26262. </method>
  26263. <doc>
  26264. <![CDATA[Utility for collecting samples and writing a partition file for
  26265. {@link TotalOrderPartitioner}.]]>
  26266. </doc>
  26267. </class>
  26268. <!-- end class org.apache.hadoop.mapreduce.lib.partition.InputSampler -->
  26269. <!-- start class org.apache.hadoop.mapreduce.lib.partition.InputSampler.IntervalSampler -->
  26270. <class name="InputSampler.IntervalSampler" extends="java.lang.Object"
  26271. abstract="false"
  26272. static="true" final="false" visibility="public"
  26273. deprecated="not deprecated">
  26274. <implements name="org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler"/>
  26275. <constructor name="InputSampler.IntervalSampler" type="double"
  26276. static="false" final="false" visibility="public"
  26277. deprecated="not deprecated">
  26278. <doc>
  26279. <![CDATA[Create a new IntervalSampler sampling <em>all</em> splits.
  26280. @param freq The frequency with which records will be emitted.]]>
  26281. </doc>
  26282. </constructor>
  26283. <constructor name="InputSampler.IntervalSampler" type="double, int"
  26284. static="false" final="false" visibility="public"
  26285. deprecated="not deprecated">
  26286. <doc>
  26287. <![CDATA[Create a new IntervalSampler.
  26288. @param freq The frequency with which records will be emitted.
  26289. @param maxSplitsSampled The maximum number of splits to examine.
  26290. @see #getSample]]>
  26291. </doc>
  26292. </constructor>
  26293. <method name="getSample" return="K[]"
  26294. abstract="false" native="false" synchronized="false"
  26295. static="false" final="false" visibility="public"
  26296. deprecated="not deprecated">
  26297. <param name="inf" type="org.apache.hadoop.mapreduce.InputFormat"/>
  26298. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26299. <exception name="IOException" type="java.io.IOException"/>
  26300. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26301. <doc>
  26302. <![CDATA[For each split sampled, emit when the ratio of the number of records
  26303. retained to the total record count is less than the specified
  26304. frequency.]]>
  26305. </doc>
  26306. </method>
  26307. <doc>
  26308. <![CDATA[Sample from s splits at regular intervals.
  26309. Useful for sorted data.]]>
  26310. </doc>
  26311. </class>
  26312. <!-- end class org.apache.hadoop.mapreduce.lib.partition.InputSampler.IntervalSampler -->
  26313. <!-- start class org.apache.hadoop.mapreduce.lib.partition.InputSampler.RandomSampler -->
  26314. <class name="InputSampler.RandomSampler" extends="java.lang.Object"
  26315. abstract="false"
  26316. static="true" final="false" visibility="public"
  26317. deprecated="not deprecated">
  26318. <implements name="org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler"/>
  26319. <constructor name="InputSampler.RandomSampler" type="double, int"
  26320. static="false" final="false" visibility="public"
  26321. deprecated="not deprecated">
  26322. <doc>
  26323. <![CDATA[Create a new RandomSampler sampling <em>all</em> splits.
  26324. This will read every split at the client, which is very expensive.
  26325. @param freq Probability with which a key will be chosen.
  26326. @param numSamples Total number of samples to obtain from all selected
  26327. splits.]]>
  26328. </doc>
  26329. </constructor>
  26330. <constructor name="InputSampler.RandomSampler" type="double, int, int"
  26331. static="false" final="false" visibility="public"
  26332. deprecated="not deprecated">
  26333. <doc>
  26334. <![CDATA[Create a new RandomSampler.
  26335. @param freq Probability with which a key will be chosen.
  26336. @param numSamples Total number of samples to obtain from all selected
  26337. splits.
  26338. @param maxSplitsSampled The maximum number of splits to examine.]]>
  26339. </doc>
  26340. </constructor>
  26341. <method name="getSample" return="K[]"
  26342. abstract="false" native="false" synchronized="false"
  26343. static="false" final="false" visibility="public"
  26344. deprecated="not deprecated">
  26345. <param name="inf" type="org.apache.hadoop.mapreduce.InputFormat"/>
  26346. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26347. <exception name="IOException" type="java.io.IOException"/>
  26348. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26349. <doc>
  26350. <![CDATA[Randomize the split order, then take the specified number of keys from
  26351. each split sampled, where each key is selected with the specified
  26352. probability and possibly replaced by a subsequently selected key when
  26353. the quota of keys from that split is satisfied.]]>
  26354. </doc>
  26355. </method>
  26356. <doc>
  26357. <![CDATA[Sample from random points in the input.
  26358. General-purpose sampler. Takes numSamples / maxSplitsSampled inputs from
  26359. each split.]]>
  26360. </doc>
  26361. </class>
  26362. <!-- end class org.apache.hadoop.mapreduce.lib.partition.InputSampler.RandomSampler -->
  26363. <!-- start interface org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler -->
  26364. <interface name="InputSampler.Sampler" abstract="true"
  26365. static="true" final="false" visibility="public"
  26366. deprecated="not deprecated">
  26367. <method name="getSample" return="K[]"
  26368. abstract="false" native="false" synchronized="false"
  26369. static="false" final="false" visibility="public"
  26370. deprecated="not deprecated">
  26371. <param name="inf" type="org.apache.hadoop.mapreduce.InputFormat"/>
  26372. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26373. <exception name="IOException" type="java.io.IOException"/>
  26374. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26375. <doc>
  26376. <![CDATA[For a given job, collect and return a subset of the keys from the
  26377. input data.]]>
  26378. </doc>
  26379. </method>
  26380. <doc>
  26381. <![CDATA[Interface to sample using an
  26382. {@link org.apache.hadoop.mapreduce.InputFormat}.]]>
  26383. </doc>
  26384. </interface>
  26385. <!-- end interface org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler -->
  26386. <!-- start class org.apache.hadoop.mapreduce.lib.partition.InputSampler.SplitSampler -->
  26387. <class name="InputSampler.SplitSampler" extends="java.lang.Object"
  26388. abstract="false"
  26389. static="true" final="false" visibility="public"
  26390. deprecated="not deprecated">
  26391. <implements name="org.apache.hadoop.mapreduce.lib.partition.InputSampler.Sampler"/>
  26392. <constructor name="InputSampler.SplitSampler" type="int"
  26393. static="false" final="false" visibility="public"
  26394. deprecated="not deprecated">
  26395. <doc>
  26396. <![CDATA[Create a SplitSampler sampling <em>all</em> splits.
  26397. Takes the first numSamples / numSplits records from each split.
  26398. @param numSamples Total number of samples to obtain from all selected
  26399. splits.]]>
  26400. </doc>
  26401. </constructor>
  26402. <constructor name="InputSampler.SplitSampler" type="int, int"
  26403. static="false" final="false" visibility="public"
  26404. deprecated="not deprecated">
  26405. <doc>
  26406. <![CDATA[Create a new SplitSampler.
  26407. @param numSamples Total number of samples to obtain from all selected
  26408. splits.
  26409. @param maxSplitsSampled The maximum number of splits to examine.]]>
  26410. </doc>
  26411. </constructor>
  26412. <method name="getSample" return="K[]"
  26413. abstract="false" native="false" synchronized="false"
  26414. static="false" final="false" visibility="public"
  26415. deprecated="not deprecated">
  26416. <param name="inf" type="org.apache.hadoop.mapreduce.InputFormat"/>
  26417. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26418. <exception name="IOException" type="java.io.IOException"/>
  26419. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26420. <doc>
  26421. <![CDATA[From each split sampled, take the first numSamples / numSplits records.]]>
  26422. </doc>
  26423. </method>
  26424. <doc>
  26425. <![CDATA[Samples the first n records from s splits.
  26426. Inexpensive way to sample random data.]]>
  26427. </doc>
  26428. </class>
  26429. <!-- end class org.apache.hadoop.mapreduce.lib.partition.InputSampler.SplitSampler -->
  26430. <!-- start class org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedComparator -->
  26431. <class name="KeyFieldBasedComparator" extends="org.apache.hadoop.io.WritableComparator"
  26432. abstract="false"
  26433. static="false" final="false" visibility="public"
  26434. deprecated="not deprecated">
  26435. <implements name="org.apache.hadoop.conf.Configurable"/>
  26436. <constructor name="KeyFieldBasedComparator"
  26437. static="false" final="false" visibility="public"
  26438. deprecated="not deprecated">
  26439. </constructor>
  26440. <method name="setConf"
  26441. abstract="false" native="false" synchronized="false"
  26442. static="false" final="false" visibility="public"
  26443. deprecated="not deprecated">
  26444. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26445. </method>
  26446. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  26447. abstract="false" native="false" synchronized="false"
  26448. static="false" final="false" visibility="public"
  26449. deprecated="not deprecated">
  26450. </method>
  26451. <method name="compare" return="int"
  26452. abstract="false" native="false" synchronized="false"
  26453. static="false" final="false" visibility="public"
  26454. deprecated="not deprecated">
  26455. <param name="b1" type="byte[]"/>
  26456. <param name="s1" type="int"/>
  26457. <param name="l1" type="int"/>
  26458. <param name="b2" type="byte[]"/>
  26459. <param name="s2" type="int"/>
  26460. <param name="l2" type="int"/>
  26461. </method>
  26462. <method name="setKeyFieldComparatorOptions"
  26463. abstract="false" native="false" synchronized="false"
  26464. static="true" final="false" visibility="public"
  26465. deprecated="not deprecated">
  26466. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26467. <param name="keySpec" type="java.lang.String"/>
  26468. <doc>
  26469. <![CDATA[Set the {@link KeyFieldBasedComparator} options used to compare keys.
  26470. @param keySpec the key specification of the form -k pos1[,pos2], where,
  26471. pos is of the form f[.c][opts], where f is the number
  26472. of the key field to use, and c is the number of the first character from
  26473. the beginning of the field. Fields and character positions are numbered
  26474. starting with 1; a character position of zero in pos2 indicates the
  26475. field's last character. If '.c' is omitted from pos1, it defaults to 1
  26476. (the beginning of the field); if omitted from pos2, it defaults to 0
  26477. (the end of the field). opts are ordering options. The supported options
  26478. are:
  26479. -n, (Sort numerically)
  26480. -r, (Reverse the result of comparison)]]>
  26481. </doc>
  26482. </method>
  26483. <method name="getKeyFieldComparatorOption" return="java.lang.String"
  26484. abstract="false" native="false" synchronized="false"
  26485. static="true" final="false" visibility="public"
  26486. deprecated="not deprecated">
  26487. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  26488. <doc>
  26489. <![CDATA[Get the {@link KeyFieldBasedComparator} options]]>
  26490. </doc>
  26491. </method>
  26492. <field name="COMPARATOR_OPTIONS" type="java.lang.String"
  26493. transient="false" volatile="false"
  26494. static="true" final="false" visibility="public"
  26495. deprecated="not deprecated">
  26496. </field>
  26497. <doc>
  26498. <![CDATA[This comparator implementation provides a subset of the features provided
  26499. by the Unix/GNU Sort. In particular, the supported features are:
  26500. -n, (Sort numerically)
  26501. -r, (Reverse the result of comparison)
  26502. -k pos1[,pos2], where pos is of the form f[.c][opts], where f is the number
  26503. of the field to use, and c is the number of the first character from the
  26504. beginning of the field. Fields and character positions are numbered starting
  26505. with 1; a character position of zero in pos2 indicates the field's last
  26506. character. If '.c' is omitted from pos1, it defaults to 1 (the beginning
  26507. of the field); if omitted from pos2, it defaults to 0 (the end of the
  26508. field). opts are ordering options (any of 'nr' as described above).
  26509. We assume that the fields in the key are separated by
  26510. {@link JobContext#MAP_OUTPUT_KEY_FIELD_SEPERATOR}.]]>
  26511. </doc>
  26512. </class>
  26513. <!-- end class org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedComparator -->
  26514. <!-- start class org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedPartitioner -->
  26515. <class name="KeyFieldBasedPartitioner" extends="org.apache.hadoop.mapreduce.Partitioner"
  26516. abstract="false"
  26517. static="false" final="false" visibility="public"
  26518. deprecated="not deprecated">
  26519. <implements name="org.apache.hadoop.conf.Configurable"/>
  26520. <constructor name="KeyFieldBasedPartitioner"
  26521. static="false" final="false" visibility="public"
  26522. deprecated="not deprecated">
  26523. </constructor>
  26524. <method name="setConf"
  26525. abstract="false" native="false" synchronized="false"
  26526. static="false" final="false" visibility="public"
  26527. deprecated="not deprecated">
  26528. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26529. </method>
  26530. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  26531. abstract="false" native="false" synchronized="false"
  26532. static="false" final="false" visibility="public"
  26533. deprecated="not deprecated">
  26534. </method>
  26535. <method name="getPartition" return="int"
  26536. abstract="false" native="false" synchronized="false"
  26537. static="false" final="false" visibility="public"
  26538. deprecated="not deprecated">
  26539. <param name="key" type="K2"/>
  26540. <param name="value" type="V2"/>
  26541. <param name="numReduceTasks" type="int"/>
  26542. </method>
  26543. <method name="hashCode" return="int"
  26544. abstract="false" native="false" synchronized="false"
  26545. static="false" final="false" visibility="protected"
  26546. deprecated="not deprecated">
  26547. <param name="b" type="byte[]"/>
  26548. <param name="start" type="int"/>
  26549. <param name="end" type="int"/>
  26550. <param name="currentHash" type="int"/>
  26551. </method>
  26552. <method name="getPartition" return="int"
  26553. abstract="false" native="false" synchronized="false"
  26554. static="false" final="false" visibility="protected"
  26555. deprecated="not deprecated">
  26556. <param name="hash" type="int"/>
  26557. <param name="numReduceTasks" type="int"/>
  26558. </method>
  26559. <method name="setKeyFieldPartitionerOptions"
  26560. abstract="false" native="false" synchronized="false"
  26561. static="false" final="false" visibility="public"
  26562. deprecated="not deprecated">
  26563. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  26564. <param name="keySpec" type="java.lang.String"/>
  26565. <doc>
  26566. <![CDATA[Set the {@link KeyFieldBasedPartitioner} options used for
  26567. {@link Partitioner}
  26568. @param keySpec the key specification of the form -k pos1[,pos2], where,
  26569. pos is of the form f[.c][opts], where f is the number
  26570. of the key field to use, and c is the number of the first character from
  26571. the beginning of the field. Fields and character positions are numbered
  26572. starting with 1; a character position of zero in pos2 indicates the
  26573. field's last character. If '.c' is omitted from pos1, it defaults to 1
  26574. (the beginning of the field); if omitted from pos2, it defaults to 0
  26575. (the end of the field).]]>
  26576. </doc>
  26577. </method>
  26578. <method name="getKeyFieldPartitionerOption" return="java.lang.String"
  26579. abstract="false" native="false" synchronized="false"
  26580. static="false" final="false" visibility="public"
  26581. deprecated="not deprecated">
  26582. <param name="job" type="org.apache.hadoop.mapreduce.JobContext"/>
  26583. <doc>
  26584. <![CDATA[Get the {@link KeyFieldBasedPartitioner} options]]>
  26585. </doc>
  26586. </method>
  26587. <field name="PARTITIONER_OPTIONS" type="java.lang.String"
  26588. transient="false" volatile="false"
  26589. static="true" final="false" visibility="public"
  26590. deprecated="not deprecated">
  26591. </field>
  26592. <doc>
  26593. <![CDATA[Defines a way to partition keys based on certain key fields (also see
  26594. {@link KeyFieldBasedComparator}).
  26595. The key specification supported is of the form -k pos1[,pos2], where,
  26596. pos is of the form f[.c][opts], where f is the number
  26597. of the key field to use, and c is the number of the first character from
  26598. the beginning of the field. Fields and character positions are numbered
  26599. starting with 1; a character position of zero in pos2 indicates the
  26600. field's last character. If '.c' is omitted from pos1, it defaults to 1
  26601. (the beginning of the field); if omitted from pos2, it defaults to 0
  26602. (the end of the field).]]>
  26603. </doc>
  26604. </class>
  26605. <!-- end class org.apache.hadoop.mapreduce.lib.partition.KeyFieldBasedPartitioner -->
  26606. <!-- start class org.apache.hadoop.mapreduce.lib.partition.TotalOrderPartitioner -->
  26607. <class name="TotalOrderPartitioner" extends="org.apache.hadoop.mapreduce.Partitioner"
  26608. abstract="false"
  26609. static="false" final="false" visibility="public"
  26610. deprecated="not deprecated">
  26611. <implements name="org.apache.hadoop.conf.Configurable"/>
  26612. <constructor name="TotalOrderPartitioner"
  26613. static="false" final="false" visibility="public"
  26614. deprecated="not deprecated">
  26615. </constructor>
  26616. <method name="setConf"
  26617. abstract="false" native="false" synchronized="false"
  26618. static="false" final="false" visibility="public"
  26619. deprecated="not deprecated">
  26620. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26621. <doc>
  26622. <![CDATA[Read in the partition file and build indexing data structures.
  26623. If the keytype is {@link org.apache.hadoop.io.BinaryComparable} and
  26624. <tt>total.order.partitioner.natural.order</tt> is not false, a trie
  26625. of the first <tt>total.order.partitioner.max.trie.depth</tt>(2) + 1 bytes
  26626. will be built. Otherwise, keys will be located using a binary search of
  26627. the partition keyset using the {@link org.apache.hadoop.io.RawComparator}
  26628. defined for this job. The input file must be sorted with the same
  26629. comparator and contain {@link Job#getNumReduceTasks()} - 1 keys.]]>
  26630. </doc>
  26631. </method>
  26632. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  26633. abstract="false" native="false" synchronized="false"
  26634. static="false" final="false" visibility="public"
  26635. deprecated="not deprecated">
  26636. </method>
  26637. <method name="getPartition" return="int"
  26638. abstract="false" native="false" synchronized="false"
  26639. static="false" final="false" visibility="public"
  26640. deprecated="not deprecated">
  26641. <param name="key" type="K"/>
  26642. <param name="value" type="V"/>
  26643. <param name="numPartitions" type="int"/>
  26644. </method>
  26645. <method name="setPartitionFile"
  26646. abstract="false" native="false" synchronized="false"
  26647. static="true" final="false" visibility="public"
  26648. deprecated="not deprecated">
  26649. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26650. <param name="p" type="org.apache.hadoop.fs.Path"/>
  26651. <doc>
  26652. <![CDATA[Set the path to the SequenceFile storing the sorted partition keyset.
  26653. It must be the case that for <tt>R</tt> reduces, there are <tt>R-1</tt>
  26654. keys in the SequenceFile.]]>
  26655. </doc>
  26656. </method>
  26657. <method name="getPartitionFile" return="java.lang.String"
  26658. abstract="false" native="false" synchronized="false"
  26659. static="true" final="false" visibility="public"
  26660. deprecated="not deprecated">
  26661. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  26662. <doc>
  26663. <![CDATA[Get the path to the SequenceFile storing the sorted partition keyset.
  26664. @see #setPartitionFile(Configuration, Path)]]>
  26665. </doc>
  26666. </method>
  26667. <field name="DEFAULT_PATH" type="java.lang.String"
  26668. transient="false" volatile="false"
  26669. static="true" final="true" visibility="public"
  26670. deprecated="not deprecated">
  26671. </field>
  26672. <field name="PARTITIONER_PATH" type="java.lang.String"
  26673. transient="false" volatile="false"
  26674. static="true" final="true" visibility="public"
  26675. deprecated="not deprecated">
  26676. </field>
  26677. <field name="MAX_TRIE_DEPTH" type="java.lang.String"
  26678. transient="false" volatile="false"
  26679. static="true" final="true" visibility="public"
  26680. deprecated="not deprecated">
  26681. </field>
  26682. <field name="NATURAL_ORDER" type="java.lang.String"
  26683. transient="false" volatile="false"
  26684. static="true" final="true" visibility="public"
  26685. deprecated="not deprecated">
  26686. </field>
  26687. <doc>
  26688. <![CDATA[Partitioner effecting a total order by reading split points from
  26689. an externally generated source.]]>
  26690. </doc>
  26691. </class>
  26692. <!-- end class org.apache.hadoop.mapreduce.lib.partition.TotalOrderPartitioner -->
  26693. </package>
  26694. <package name="org.apache.hadoop.mapreduce.lib.reduce">
  26695. <!-- start class org.apache.hadoop.mapreduce.lib.reduce.IntSumReducer -->
  26696. <class name="IntSumReducer" extends="org.apache.hadoop.mapreduce.Reducer"
  26697. abstract="false"
  26698. static="false" final="false" visibility="public"
  26699. deprecated="not deprecated">
  26700. <constructor name="IntSumReducer"
  26701. static="false" final="false" visibility="public"
  26702. deprecated="not deprecated">
  26703. </constructor>
  26704. <method name="reduce"
  26705. abstract="false" native="false" synchronized="false"
  26706. static="false" final="false" visibility="public"
  26707. deprecated="not deprecated">
  26708. <param name="key" type="Key"/>
  26709. <param name="values" type="java.lang.Iterable"/>
  26710. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  26711. <exception name="IOException" type="java.io.IOException"/>
  26712. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26713. </method>
  26714. </class>
  26715. <!-- end class org.apache.hadoop.mapreduce.lib.reduce.IntSumReducer -->
  26716. <!-- start class org.apache.hadoop.mapreduce.lib.reduce.LongSumReducer -->
  26717. <class name="LongSumReducer" extends="org.apache.hadoop.mapreduce.Reducer"
  26718. abstract="false"
  26719. static="false" final="false" visibility="public"
  26720. deprecated="not deprecated">
  26721. <constructor name="LongSumReducer"
  26722. static="false" final="false" visibility="public"
  26723. deprecated="not deprecated">
  26724. </constructor>
  26725. <method name="reduce"
  26726. abstract="false" native="false" synchronized="false"
  26727. static="false" final="false" visibility="public"
  26728. deprecated="not deprecated">
  26729. <param name="key" type="KEY"/>
  26730. <param name="values" type="java.lang.Iterable"/>
  26731. <param name="context" type="org.apache.hadoop.mapreduce.Reducer.Context"/>
  26732. <exception name="IOException" type="java.io.IOException"/>
  26733. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26734. </method>
  26735. </class>
  26736. <!-- end class org.apache.hadoop.mapreduce.lib.reduce.LongSumReducer -->
  26737. <!-- start class org.apache.hadoop.mapreduce.lib.reduce.WrappedReducer -->
  26738. <class name="WrappedReducer" extends="org.apache.hadoop.mapreduce.Reducer"
  26739. abstract="false"
  26740. static="false" final="false" visibility="public"
  26741. deprecated="not deprecated">
  26742. <constructor name="WrappedReducer"
  26743. static="false" final="false" visibility="public"
  26744. deprecated="not deprecated">
  26745. </constructor>
  26746. <method name="getReducerContext" return="org.apache.hadoop.mapreduce.Reducer.Context"
  26747. abstract="false" native="false" synchronized="false"
  26748. static="false" final="false" visibility="public"
  26749. deprecated="not deprecated">
  26750. <param name="reduceContext" type="org.apache.hadoop.mapreduce.ReduceContext"/>
  26751. <doc>
  26752. <![CDATA[Get a wrapped {@link Reducer.Context} for custom implementations.
  26753. @param reduceContext <code>ReduceContext</code> to be wrapped
  26754. @return a wrapped <code>Reducer.Context</code> for custom implementations]]>
  26755. </doc>
  26756. </method>
  26757. <doc>
  26758. <![CDATA[A {@link Reducer} which wraps a given one to allow for custom
  26759. {@link Reducer.Context} implementations.]]>
  26760. </doc>
  26761. </class>
  26762. <!-- end class org.apache.hadoop.mapreduce.lib.reduce.WrappedReducer -->
  26763. <!-- start class org.apache.hadoop.mapreduce.lib.reduce.WrappedReducer.Context -->
  26764. <class name="WrappedReducer.Context" extends="org.apache.hadoop.mapreduce.Reducer.Context"
  26765. abstract="false"
  26766. static="false" final="false" visibility="public"
  26767. deprecated="not deprecated">
  26768. <constructor name="WrappedReducer.Context" type="org.apache.hadoop.mapreduce.ReduceContext"
  26769. static="false" final="false" visibility="public"
  26770. deprecated="not deprecated">
  26771. </constructor>
  26772. <method name="getCurrentKey" return="KEYIN"
  26773. abstract="false" native="false" synchronized="false"
  26774. static="false" final="false" visibility="public"
  26775. deprecated="not deprecated">
  26776. <exception name="IOException" type="java.io.IOException"/>
  26777. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26778. </method>
  26779. <method name="getCurrentValue" return="VALUEIN"
  26780. abstract="false" native="false" synchronized="false"
  26781. static="false" final="false" visibility="public"
  26782. deprecated="not deprecated">
  26783. <exception name="IOException" type="java.io.IOException"/>
  26784. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26785. </method>
  26786. <method name="nextKeyValue" return="boolean"
  26787. abstract="false" native="false" synchronized="false"
  26788. static="false" final="false" visibility="public"
  26789. deprecated="not deprecated">
  26790. <exception name="IOException" type="java.io.IOException"/>
  26791. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26792. </method>
  26793. <method name="getCounter" return="org.apache.hadoop.mapreduce.Counter"
  26794. abstract="false" native="false" synchronized="false"
  26795. static="false" final="false" visibility="public"
  26796. deprecated="not deprecated">
  26797. <param name="counterName" type="java.lang.Enum"/>
  26798. </method>
  26799. <method name="getCounter" return="org.apache.hadoop.mapreduce.Counter"
  26800. abstract="false" native="false" synchronized="false"
  26801. static="false" final="false" visibility="public"
  26802. deprecated="not deprecated">
  26803. <param name="groupName" type="java.lang.String"/>
  26804. <param name="counterName" type="java.lang.String"/>
  26805. </method>
  26806. <method name="getOutputCommitter" return="org.apache.hadoop.mapreduce.OutputCommitter"
  26807. abstract="false" native="false" synchronized="false"
  26808. static="false" final="false" visibility="public"
  26809. deprecated="not deprecated">
  26810. </method>
  26811. <method name="write"
  26812. abstract="false" native="false" synchronized="false"
  26813. static="false" final="false" visibility="public"
  26814. deprecated="not deprecated">
  26815. <param name="key" type="KEYOUT"/>
  26816. <param name="value" type="VALUEOUT"/>
  26817. <exception name="IOException" type="java.io.IOException"/>
  26818. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  26819. </method>
  26820. <method name="getStatus" return="java.lang.String"
  26821. abstract="false" native="false" synchronized="false"
  26822. static="false" final="false" visibility="public"
  26823. deprecated="not deprecated">
  26824. </method>
  26825. <method name="getTaskAttemptID" return="org.apache.hadoop.mapreduce.TaskAttemptID"
  26826. abstract="false" native="false" synchronized="false"
  26827. static="false" final="false" visibility="public"
  26828. deprecated="not deprecated">
  26829. </method>
  26830. <method name="setStatus"
  26831. abstract="false" native="false" synchronized="false"
  26832. static="false" final="false" visibility="public"
  26833. deprecated="not deprecated">
  26834. <param name="msg" type="java.lang.String"/>
  26835. </method>
  26836. <method name="getArchiveClassPaths" return="org.apache.hadoop.fs.Path[]"
  26837. abstract="false" native="false" synchronized="false"
  26838. static="false" final="false" visibility="public"
  26839. deprecated="not deprecated">
  26840. </method>
  26841. <method name="getArchiveTimestamps" return="java.lang.String[]"
  26842. abstract="false" native="false" synchronized="false"
  26843. static="false" final="false" visibility="public"
  26844. deprecated="not deprecated">
  26845. </method>
  26846. <method name="getCacheArchives" return="java.net.URI[]"
  26847. abstract="false" native="false" synchronized="false"
  26848. static="false" final="false" visibility="public"
  26849. deprecated="not deprecated">
  26850. <exception name="IOException" type="java.io.IOException"/>
  26851. </method>
  26852. <method name="getCacheFiles" return="java.net.URI[]"
  26853. abstract="false" native="false" synchronized="false"
  26854. static="false" final="false" visibility="public"
  26855. deprecated="not deprecated">
  26856. <exception name="IOException" type="java.io.IOException"/>
  26857. </method>
  26858. <method name="getCombinerClass" return="java.lang.Class"
  26859. abstract="false" native="false" synchronized="false"
  26860. static="false" final="false" visibility="public"
  26861. deprecated="not deprecated">
  26862. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26863. </method>
  26864. <method name="getConfiguration" return="org.apache.hadoop.conf.Configuration"
  26865. abstract="false" native="false" synchronized="false"
  26866. static="false" final="false" visibility="public"
  26867. deprecated="not deprecated">
  26868. </method>
  26869. <method name="getFileClassPaths" return="org.apache.hadoop.fs.Path[]"
  26870. abstract="false" native="false" synchronized="false"
  26871. static="false" final="false" visibility="public"
  26872. deprecated="not deprecated">
  26873. </method>
  26874. <method name="getFileTimestamps" return="java.lang.String[]"
  26875. abstract="false" native="false" synchronized="false"
  26876. static="false" final="false" visibility="public"
  26877. deprecated="not deprecated">
  26878. </method>
  26879. <method name="getGroupingComparator" return="org.apache.hadoop.io.RawComparator"
  26880. abstract="false" native="false" synchronized="false"
  26881. static="false" final="false" visibility="public"
  26882. deprecated="not deprecated">
  26883. </method>
  26884. <method name="getInputFormatClass" return="java.lang.Class"
  26885. abstract="false" native="false" synchronized="false"
  26886. static="false" final="false" visibility="public"
  26887. deprecated="not deprecated">
  26888. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26889. </method>
  26890. <method name="getJar" return="java.lang.String"
  26891. abstract="false" native="false" synchronized="false"
  26892. static="false" final="false" visibility="public"
  26893. deprecated="not deprecated">
  26894. </method>
  26895. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  26896. abstract="false" native="false" synchronized="false"
  26897. static="false" final="false" visibility="public"
  26898. deprecated="not deprecated">
  26899. </method>
  26900. <method name="getJobName" return="java.lang.String"
  26901. abstract="false" native="false" synchronized="false"
  26902. static="false" final="false" visibility="public"
  26903. deprecated="not deprecated">
  26904. </method>
  26905. <method name="getJobSetupCleanupNeeded" return="boolean"
  26906. abstract="false" native="false" synchronized="false"
  26907. static="false" final="false" visibility="public"
  26908. deprecated="not deprecated">
  26909. </method>
  26910. <method name="getLocalCacheArchives" return="org.apache.hadoop.fs.Path[]"
  26911. abstract="false" native="false" synchronized="false"
  26912. static="false" final="false" visibility="public"
  26913. deprecated="not deprecated">
  26914. <exception name="IOException" type="java.io.IOException"/>
  26915. </method>
  26916. <method name="getLocalCacheFiles" return="org.apache.hadoop.fs.Path[]"
  26917. abstract="false" native="false" synchronized="false"
  26918. static="false" final="false" visibility="public"
  26919. deprecated="not deprecated">
  26920. <exception name="IOException" type="java.io.IOException"/>
  26921. </method>
  26922. <method name="getMapOutputKeyClass" return="java.lang.Class"
  26923. abstract="false" native="false" synchronized="false"
  26924. static="false" final="false" visibility="public"
  26925. deprecated="not deprecated">
  26926. </method>
  26927. <method name="getMapOutputValueClass" return="java.lang.Class"
  26928. abstract="false" native="false" synchronized="false"
  26929. static="false" final="false" visibility="public"
  26930. deprecated="not deprecated">
  26931. </method>
  26932. <method name="getMapperClass" return="java.lang.Class"
  26933. abstract="false" native="false" synchronized="false"
  26934. static="false" final="false" visibility="public"
  26935. deprecated="not deprecated">
  26936. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26937. </method>
  26938. <method name="getMaxMapAttempts" return="int"
  26939. abstract="false" native="false" synchronized="false"
  26940. static="false" final="false" visibility="public"
  26941. deprecated="not deprecated">
  26942. </method>
  26943. <method name="getMaxReduceAttempts" return="int"
  26944. abstract="false" native="false" synchronized="false"
  26945. static="false" final="false" visibility="public"
  26946. deprecated="not deprecated">
  26947. </method>
  26948. <method name="getNumReduceTasks" return="int"
  26949. abstract="false" native="false" synchronized="false"
  26950. static="false" final="false" visibility="public"
  26951. deprecated="not deprecated">
  26952. </method>
  26953. <method name="getOutputFormatClass" return="java.lang.Class"
  26954. abstract="false" native="false" synchronized="false"
  26955. static="false" final="false" visibility="public"
  26956. deprecated="not deprecated">
  26957. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26958. </method>
  26959. <method name="getOutputKeyClass" return="java.lang.Class"
  26960. abstract="false" native="false" synchronized="false"
  26961. static="false" final="false" visibility="public"
  26962. deprecated="not deprecated">
  26963. </method>
  26964. <method name="getOutputValueClass" return="java.lang.Class"
  26965. abstract="false" native="false" synchronized="false"
  26966. static="false" final="false" visibility="public"
  26967. deprecated="not deprecated">
  26968. </method>
  26969. <method name="getPartitionerClass" return="java.lang.Class"
  26970. abstract="false" native="false" synchronized="false"
  26971. static="false" final="false" visibility="public"
  26972. deprecated="not deprecated">
  26973. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26974. </method>
  26975. <method name="getReducerClass" return="java.lang.Class"
  26976. abstract="false" native="false" synchronized="false"
  26977. static="false" final="false" visibility="public"
  26978. deprecated="not deprecated">
  26979. <exception name="ClassNotFoundException" type="java.lang.ClassNotFoundException"/>
  26980. </method>
  26981. <method name="getSortComparator" return="org.apache.hadoop.io.RawComparator"
  26982. abstract="false" native="false" synchronized="false"
  26983. static="false" final="false" visibility="public"
  26984. deprecated="not deprecated">
  26985. </method>
  26986. <method name="getSymlink" return="boolean"
  26987. abstract="false" native="false" synchronized="false"
  26988. static="false" final="false" visibility="public"
  26989. deprecated="not deprecated">
  26990. </method>
  26991. <method name="getWorkingDirectory" return="org.apache.hadoop.fs.Path"
  26992. abstract="false" native="false" synchronized="false"
  26993. static="false" final="false" visibility="public"
  26994. deprecated="not deprecated">
  26995. <exception name="IOException" type="java.io.IOException"/>
  26996. </method>
  26997. <method name="progress"
  26998. abstract="false" native="false" synchronized="false"
  26999. static="false" final="false" visibility="public"
  27000. deprecated="not deprecated">
  27001. </method>
  27002. <method name="getValues" return="java.lang.Iterable"
  27003. abstract="false" native="false" synchronized="false"
  27004. static="false" final="false" visibility="public"
  27005. deprecated="not deprecated">
  27006. <exception name="IOException" type="java.io.IOException"/>
  27007. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  27008. </method>
  27009. <method name="nextKey" return="boolean"
  27010. abstract="false" native="false" synchronized="false"
  27011. static="false" final="false" visibility="public"
  27012. deprecated="not deprecated">
  27013. <exception name="IOException" type="java.io.IOException"/>
  27014. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  27015. </method>
  27016. <method name="getProfileEnabled" return="boolean"
  27017. abstract="false" native="false" synchronized="false"
  27018. static="false" final="false" visibility="public"
  27019. deprecated="not deprecated">
  27020. </method>
  27021. <method name="getProfileParams" return="java.lang.String"
  27022. abstract="false" native="false" synchronized="false"
  27023. static="false" final="false" visibility="public"
  27024. deprecated="not deprecated">
  27025. </method>
  27026. <method name="getProfileTaskRange" return="org.apache.hadoop.conf.Configuration.IntegerRanges"
  27027. abstract="false" native="false" synchronized="false"
  27028. static="false" final="false" visibility="public"
  27029. deprecated="not deprecated">
  27030. <param name="isMap" type="boolean"/>
  27031. </method>
  27032. <method name="getUser" return="java.lang.String"
  27033. abstract="false" native="false" synchronized="false"
  27034. static="false" final="false" visibility="public"
  27035. deprecated="not deprecated">
  27036. </method>
  27037. <method name="getCredentials" return="org.apache.hadoop.security.Credentials"
  27038. abstract="false" native="false" synchronized="false"
  27039. static="false" final="false" visibility="public"
  27040. deprecated="not deprecated">
  27041. </method>
  27042. <field name="reduceContext" type="org.apache.hadoop.mapreduce.ReduceContext"
  27043. transient="false" volatile="false"
  27044. static="false" final="false" visibility="protected"
  27045. deprecated="not deprecated">
  27046. </field>
  27047. </class>
  27048. <!-- end class org.apache.hadoop.mapreduce.lib.reduce.WrappedReducer.Context -->
  27049. </package>
  27050. <package name="org.apache.hadoop.mapreduce.security">
  27051. <!-- start class org.apache.hadoop.mapreduce.security.TokenCache -->
  27052. <class name="TokenCache" extends="java.lang.Object"
  27053. abstract="false"
  27054. static="false" final="false" visibility="public"
  27055. deprecated="not deprecated">
  27056. <constructor name="TokenCache"
  27057. static="false" final="false" visibility="public"
  27058. deprecated="not deprecated">
  27059. </constructor>
  27060. <method name="getSecretKey" return="byte[]"
  27061. abstract="false" native="false" synchronized="false"
  27062. static="true" final="false" visibility="public"
  27063. deprecated="not deprecated">
  27064. <param name="credentials" type="org.apache.hadoop.security.Credentials"/>
  27065. <param name="alias" type="org.apache.hadoop.io.Text"/>
  27066. <doc>
  27067. <![CDATA[auxiliary method to get user's secret keys.
  27068. @param alias
  27069. @return secret key from the storage]]>
  27070. </doc>
  27071. </method>
  27072. <method name="obtainTokensForNamenodes"
  27073. abstract="false" native="false" synchronized="false"
  27074. static="true" final="false" visibility="public"
  27075. deprecated="not deprecated">
  27076. <param name="credentials" type="org.apache.hadoop.security.Credentials"/>
  27077. <param name="ps" type="org.apache.hadoop.fs.Path[]"/>
  27078. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  27079. <exception name="IOException" type="java.io.IOException"/>
  27080. <doc>
  27081. <![CDATA[Convenience method to obtain delegation tokens from namenodes
  27082. corresponding to the paths passed.
  27083. @param credentials
  27084. @param ps array of paths
  27085. @param conf configuration
  27086. @throws IOException]]>
  27087. </doc>
  27088. </method>
  27089. <method name="getDelegationToken" return="org.apache.hadoop.security.token.Token"
  27090. abstract="false" native="false" synchronized="false"
  27091. static="true" final="false" visibility="public"
  27092. deprecated="not deprecated">
  27093. <param name="credentials" type="org.apache.hadoop.security.Credentials"/>
  27094. <param name="namenode" type="java.lang.String"/>
  27095. <doc>
  27096. <![CDATA[@param namenode
  27097. @return delegation token]]>
  27098. </doc>
  27099. </method>
  27100. <method name="loadTokens" return="org.apache.hadoop.security.Credentials"
  27101. abstract="false" native="false" synchronized="false"
  27102. static="true" final="false" visibility="public"
  27103. deprecated="not deprecated">
  27104. <param name="jobTokenFile" type="java.lang.String"/>
  27105. <param name="conf" type="org.apache.hadoop.mapred.JobConf"/>
  27106. <exception name="IOException" type="java.io.IOException"/>
  27107. <doc>
  27108. <![CDATA[load job token from a file
  27109. @param conf
  27110. @throws IOException]]>
  27111. </doc>
  27112. </method>
  27113. <method name="setJobToken"
  27114. abstract="false" native="false" synchronized="false"
  27115. static="true" final="false" visibility="public"
  27116. deprecated="not deprecated">
  27117. <param name="t" type="org.apache.hadoop.security.token.Token"/>
  27118. <param name="credentials" type="org.apache.hadoop.security.Credentials"/>
  27119. <doc>
  27120. <![CDATA[store job token
  27121. @param t]]>
  27122. </doc>
  27123. </method>
  27124. <method name="getJobToken" return="org.apache.hadoop.security.token.Token"
  27125. abstract="false" native="false" synchronized="false"
  27126. static="true" final="false" visibility="public"
  27127. deprecated="not deprecated">
  27128. <param name="credentials" type="org.apache.hadoop.security.Credentials"/>
  27129. <doc>
  27130. <![CDATA[@return job token]]>
  27131. </doc>
  27132. </method>
  27133. <field name="JOB_TOKEN_HDFS_FILE" type="java.lang.String"
  27134. transient="false" volatile="false"
  27135. static="true" final="true" visibility="public"
  27136. deprecated="not deprecated">
  27137. <doc>
  27138. <![CDATA[file name used on HDFS for generated job token]]>
  27139. </doc>
  27140. </field>
  27141. <field name="JOB_TOKENS_FILENAME" type="java.lang.String"
  27142. transient="false" volatile="false"
  27143. static="true" final="true" visibility="public"
  27144. deprecated="not deprecated">
  27145. <doc>
  27146. <![CDATA[conf setting for job tokens cache file name]]>
  27147. </doc>
  27148. </field>
  27149. <doc>
  27150. <![CDATA[This class provides user facing APIs for transferring secrets from
  27151. the job client to the tasks.
  27152. The secrets can be stored just before submission of jobs and read during
  27153. the task execution.]]>
  27154. </doc>
  27155. </class>
  27156. <!-- end class org.apache.hadoop.mapreduce.security.TokenCache -->
  27157. </package>
  27158. <package name="org.apache.hadoop.mapreduce.server.jobtracker">
  27159. <!-- start class org.apache.hadoop.mapreduce.server.jobtracker.State -->
  27160. <class name="State" extends="java.lang.Enum"
  27161. abstract="false"
  27162. static="false" final="true" visibility="public"
  27163. deprecated="Use {@link JobTrackerStatus} instead.">
  27164. <method name="values" return="org.apache.hadoop.mapreduce.server.jobtracker.State[]"
  27165. abstract="false" native="false" synchronized="false"
  27166. static="true" final="false" visibility="public"
  27167. deprecated="not deprecated">
  27168. </method>
  27169. <method name="valueOf" return="org.apache.hadoop.mapreduce.server.jobtracker.State"
  27170. abstract="false" native="false" synchronized="false"
  27171. static="true" final="false" visibility="public"
  27172. deprecated="not deprecated">
  27173. <param name="name" type="java.lang.String"/>
  27174. </method>
  27175. <doc>
  27176. <![CDATA[Describes the state of JobTracker
  27177. @deprecated Use {@link JobTrackerStatus} instead.]]>
  27178. </doc>
  27179. </class>
  27180. <!-- end class org.apache.hadoop.mapreduce.server.jobtracker.State -->
  27181. </package>
  27182. <package name="org.apache.hadoop.mapreduce.tools">
  27183. <!-- start class org.apache.hadoop.mapreduce.tools.CLI -->
  27184. <class name="CLI" extends="org.apache.hadoop.conf.Configured"
  27185. abstract="false"
  27186. static="false" final="false" visibility="public"
  27187. deprecated="not deprecated">
  27188. <implements name="org.apache.hadoop.util.Tool"/>
  27189. <constructor name="CLI"
  27190. static="false" final="false" visibility="public"
  27191. deprecated="not deprecated">
  27192. </constructor>
  27193. <constructor name="CLI" type="org.apache.hadoop.conf.Configuration"
  27194. static="false" final="false" visibility="public"
  27195. deprecated="not deprecated">
  27196. </constructor>
  27197. <method name="run" return="int"
  27198. abstract="false" native="false" synchronized="false"
  27199. static="false" final="false" visibility="public"
  27200. deprecated="not deprecated">
  27201. <param name="argv" type="java.lang.String[]"/>
  27202. <exception name="Exception" type="java.lang.Exception"/>
  27203. </method>
  27204. <method name="getCounter" return="long"
  27205. abstract="false" native="false" synchronized="false"
  27206. static="false" final="false" visibility="protected"
  27207. deprecated="not deprecated">
  27208. <param name="counters" type="org.apache.hadoop.mapreduce.Counters"/>
  27209. <param name="counterGroupName" type="java.lang.String"/>
  27210. <param name="counterName" type="java.lang.String"/>
  27211. <exception name="IOException" type="java.io.IOException"/>
  27212. </method>
  27213. <method name="getTaskLogURL" return="java.lang.String"
  27214. abstract="false" native="false" synchronized="false"
  27215. static="true" final="false" visibility="protected"
  27216. deprecated="not deprecated">
  27217. <param name="taskId" type="org.apache.hadoop.mapreduce.TaskAttemptID"/>
  27218. <param name="baseUrl" type="java.lang.String"/>
  27219. </method>
  27220. <method name="displayTasks"
  27221. abstract="false" native="false" synchronized="false"
  27222. static="false" final="false" visibility="protected"
  27223. deprecated="not deprecated">
  27224. <param name="job" type="org.apache.hadoop.mapreduce.Job"/>
  27225. <param name="type" type="java.lang.String"/>
  27226. <param name="state" type="java.lang.String"/>
  27227. <exception name="IOException" type="java.io.IOException"/>
  27228. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  27229. <doc>
  27230. <![CDATA[Display the information about a job's tasks, of a particular type and
  27231. in a particular state
  27232. @param job the job
  27233. @param type the type of the task (map/reduce/setup/cleanup)
  27234. @param state the state of the task
  27235. (pending/running/completed/failed/killed)]]>
  27236. </doc>
  27237. </method>
  27238. <method name="displayJobList"
  27239. abstract="false" native="false" synchronized="false"
  27240. static="false" final="false" visibility="protected"
  27241. deprecated="not deprecated">
  27242. <param name="jobs" type="org.apache.hadoop.mapreduce.Job[]"/>
  27243. <exception name="IOException" type="java.io.IOException"/>
  27244. <exception name="InterruptedException" type="java.lang.InterruptedException"/>
  27245. </method>
  27246. <method name="main"
  27247. abstract="false" native="false" synchronized="false"
  27248. static="true" final="false" visibility="public"
  27249. deprecated="not deprecated">
  27250. <param name="argv" type="java.lang.String[]"/>
  27251. <exception name="Exception" type="java.lang.Exception"/>
  27252. </method>
  27253. <doc>
  27254. <![CDATA[Interprets the map reduce cli options]]>
  27255. </doc>
  27256. </class>
  27257. <!-- end class org.apache.hadoop.mapreduce.tools.CLI -->
  27258. </package>
  27259. <package name="org.apache.hadoop.fs">
  27260. <!-- start class org.apache.hadoop.fs.HarFileSystem -->
  27261. <class name="HarFileSystem" extends="org.apache.hadoop.fs.FilterFileSystem"
  27262. abstract="false"
  27263. static="false" final="false" visibility="public"
  27264. deprecated="not deprecated">
  27265. <constructor name="HarFileSystem"
  27266. static="false" final="false" visibility="public"
  27267. deprecated="not deprecated">
  27268. <doc>
  27269. <![CDATA[public construction of harfilesystem]]>
  27270. </doc>
  27271. </constructor>
  27272. <constructor name="HarFileSystem" type="org.apache.hadoop.fs.FileSystem"
  27273. static="false" final="false" visibility="public"
  27274. deprecated="not deprecated">
  27275. <doc>
  27276. <![CDATA[Constructor to create a HarFileSystem with an
  27277. underlying filesystem.
  27278. @param fs]]>
  27279. </doc>
  27280. </constructor>
  27281. <method name="initialize"
  27282. abstract="false" native="false" synchronized="false"
  27283. static="false" final="false" visibility="public"
  27284. deprecated="not deprecated">
  27285. <param name="name" type="java.net.URI"/>
  27286. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  27287. <exception name="IOException" type="java.io.IOException"/>
  27288. <doc>
  27289. <![CDATA[Initialize a Har filesystem per har archive. The
  27290. archive home directory is the top level directory
  27291. in the filesystem that contains the HAR archive.
  27292. Be careful with this method, you do not want to go
  27293. on creating new Filesystem instances per call to
  27294. path.getFileSystem().
  27295. the uri of Har is
  27296. har://underlyingfsscheme-host:port/archivepath.
  27297. or
  27298. har:///archivepath. This assumes the underlying filesystem
  27299. to be used in case not specified.]]>
  27300. </doc>
  27301. </method>
  27302. <method name="getHarVersion" return="int"
  27303. abstract="false" native="false" synchronized="false"
  27304. static="false" final="false" visibility="public"
  27305. deprecated="not deprecated">
  27306. <exception name="IOException" type="java.io.IOException"/>
  27307. </method>
  27308. <method name="getWorkingDirectory" return="org.apache.hadoop.fs.Path"
  27309. abstract="false" native="false" synchronized="false"
  27310. static="false" final="false" visibility="public"
  27311. deprecated="not deprecated">
  27312. <doc>
  27313. <![CDATA[return the top level archive.]]>
  27314. </doc>
  27315. </method>
  27316. <method name="getUri" return="java.net.URI"
  27317. abstract="false" native="false" synchronized="false"
  27318. static="false" final="false" visibility="public"
  27319. deprecated="not deprecated">
  27320. <doc>
  27321. <![CDATA[Returns the uri of this filesystem.
  27322. The uri is of the form
  27323. har://underlyingfsscheme-host:port/pathintheunderlyingfs]]>
  27324. </doc>
  27325. </method>
  27326. <method name="makeQualified" return="org.apache.hadoop.fs.Path"
  27327. abstract="false" native="false" synchronized="false"
  27328. static="false" final="false" visibility="public"
  27329. deprecated="not deprecated">
  27330. <param name="path" type="org.apache.hadoop.fs.Path"/>
  27331. </method>
  27332. <method name="getFileBlockLocations" return="org.apache.hadoop.fs.BlockLocation[]"
  27333. abstract="false" native="false" synchronized="false"
  27334. static="false" final="false" visibility="public"
  27335. deprecated="not deprecated">
  27336. <param name="file" type="org.apache.hadoop.fs.FileStatus"/>
  27337. <param name="start" type="long"/>
  27338. <param name="len" type="long"/>
  27339. <exception name="IOException" type="java.io.IOException"/>
  27340. <doc>
  27341. <![CDATA[get block locations from the underlying fs
  27342. @param file the input filestatus to get block locations
  27343. @param start the start in the file
  27344. @param len the length in the file
  27345. @return block locations for this segment of file
  27346. @throws IOException]]>
  27347. </doc>
  27348. </method>
  27349. <method name="getHarHash" return="int"
  27350. abstract="false" native="false" synchronized="false"
  27351. static="true" final="false" visibility="public"
  27352. deprecated="not deprecated">
  27353. <param name="p" type="org.apache.hadoop.fs.Path"/>
  27354. <doc>
  27355. <![CDATA[the hash of the path p inside
  27356. the filesystem
  27357. @param p the path in the harfilesystem
  27358. @return the hash code of the path.]]>
  27359. </doc>
  27360. </method>
  27361. <method name="getFileStatus" return="org.apache.hadoop.fs.FileStatus"
  27362. abstract="false" native="false" synchronized="false"
  27363. static="false" final="false" visibility="public"
  27364. deprecated="not deprecated">
  27365. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27366. <exception name="IOException" type="java.io.IOException"/>
  27367. <doc>
  27368. <![CDATA[return the filestatus of files in har archive.
  27369. The permissions returned are those of the archive
  27370. index files. The permissions are not persisted
  27371. while creating a hadoop archive.
  27372. @param f the path in har filesystem
  27373. @return filestatus.
  27374. @throws IOException]]>
  27375. </doc>
  27376. </method>
  27377. <method name="getFileChecksum" return="org.apache.hadoop.fs.FileChecksum"
  27378. abstract="false" native="false" synchronized="false"
  27379. static="false" final="false" visibility="public"
  27380. deprecated="not deprecated">
  27381. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27382. <doc>
  27383. <![CDATA[@return null since no checksum algorithm is implemented.]]>
  27384. </doc>
  27385. </method>
  27386. <method name="open" return="org.apache.hadoop.fs.FSDataInputStream"
  27387. abstract="false" native="false" synchronized="false"
  27388. static="false" final="false" visibility="public"
  27389. deprecated="not deprecated">
  27390. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27391. <param name="bufferSize" type="int"/>
  27392. <exception name="IOException" type="java.io.IOException"/>
  27393. <doc>
  27394. <![CDATA[Returns a har input stream which fakes end of
  27395. file. It reads the index files to get the part
  27396. file name and the size and start of the file.]]>
  27397. </doc>
  27398. </method>
  27399. <method name="create" return="org.apache.hadoop.fs.FSDataOutputStream"
  27400. abstract="false" native="false" synchronized="false"
  27401. static="false" final="false" visibility="public"
  27402. deprecated="not deprecated">
  27403. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27404. <param name="bufferSize" type="int"/>
  27405. <exception name="IOException" type="java.io.IOException"/>
  27406. </method>
  27407. <method name="create" return="org.apache.hadoop.fs.FSDataOutputStream"
  27408. abstract="false" native="false" synchronized="false"
  27409. static="false" final="false" visibility="public"
  27410. deprecated="not deprecated">
  27411. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27412. <param name="permission" type="org.apache.hadoop.fs.permission.FsPermission"/>
  27413. <param name="flag" type="java.util.EnumSet"/>
  27414. <param name="bufferSize" type="int"/>
  27415. <param name="replication" type="short"/>
  27416. <param name="blockSize" type="long"/>
  27417. <param name="progress" type="org.apache.hadoop.util.Progressable"/>
  27418. <exception name="IOException" type="java.io.IOException"/>
  27419. </method>
  27420. <method name="close"
  27421. abstract="false" native="false" synchronized="false"
  27422. static="false" final="false" visibility="public"
  27423. deprecated="not deprecated">
  27424. <exception name="IOException" type="java.io.IOException"/>
  27425. </method>
  27426. <method name="setReplication" return="boolean"
  27427. abstract="false" native="false" synchronized="false"
  27428. static="false" final="false" visibility="public"
  27429. deprecated="not deprecated">
  27430. <param name="src" type="org.apache.hadoop.fs.Path"/>
  27431. <param name="replication" type="short"/>
  27432. <exception name="IOException" type="java.io.IOException"/>
  27433. <doc>
  27434. <![CDATA[Not implemented.]]>
  27435. </doc>
  27436. </method>
  27437. <method name="delete" return="boolean"
  27438. abstract="false" native="false" synchronized="false"
  27439. static="false" final="false" visibility="public"
  27440. deprecated="not deprecated">
  27441. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27442. <param name="recursive" type="boolean"/>
  27443. <exception name="IOException" type="java.io.IOException"/>
  27444. <doc>
  27445. <![CDATA[Not implemented.]]>
  27446. </doc>
  27447. </method>
  27448. <method name="listStatus" return="org.apache.hadoop.fs.FileStatus[]"
  27449. abstract="false" native="false" synchronized="false"
  27450. static="false" final="false" visibility="public"
  27451. deprecated="not deprecated">
  27452. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27453. <exception name="IOException" type="java.io.IOException"/>
  27454. <doc>
  27455. <![CDATA[liststatus returns the children of a directory
  27456. after looking up the index files.]]>
  27457. </doc>
  27458. </method>
  27459. <method name="getHomeDirectory" return="org.apache.hadoop.fs.Path"
  27460. abstract="false" native="false" synchronized="false"
  27461. static="false" final="false" visibility="public"
  27462. deprecated="not deprecated">
  27463. <doc>
  27464. <![CDATA[return the top level archive path.]]>
  27465. </doc>
  27466. </method>
  27467. <method name="setWorkingDirectory"
  27468. abstract="false" native="false" synchronized="false"
  27469. static="false" final="false" visibility="public"
  27470. deprecated="not deprecated">
  27471. <param name="newDir" type="org.apache.hadoop.fs.Path"/>
  27472. </method>
  27473. <method name="mkdirs" return="boolean"
  27474. abstract="false" native="false" synchronized="false"
  27475. static="false" final="false" visibility="public"
  27476. deprecated="not deprecated">
  27477. <param name="f" type="org.apache.hadoop.fs.Path"/>
  27478. <param name="permission" type="org.apache.hadoop.fs.permission.FsPermission"/>
  27479. <exception name="IOException" type="java.io.IOException"/>
  27480. <doc>
  27481. <![CDATA[not implemented.]]>
  27482. </doc>
  27483. </method>
  27484. <method name="copyFromLocalFile"
  27485. abstract="false" native="false" synchronized="false"
  27486. static="false" final="false" visibility="public"
  27487. deprecated="not deprecated">
  27488. <param name="delSrc" type="boolean"/>
  27489. <param name="src" type="org.apache.hadoop.fs.Path"/>
  27490. <param name="dst" type="org.apache.hadoop.fs.Path"/>
  27491. <exception name="IOException" type="java.io.IOException"/>
  27492. <doc>
  27493. <![CDATA[not implemented.]]>
  27494. </doc>
  27495. </method>
  27496. <method name="copyToLocalFile"
  27497. abstract="false" native="false" synchronized="false"
  27498. static="false" final="false" visibility="public"
  27499. deprecated="not deprecated">
  27500. <param name="delSrc" type="boolean"/>
  27501. <param name="src" type="org.apache.hadoop.fs.Path"/>
  27502. <param name="dst" type="org.apache.hadoop.fs.Path"/>
  27503. <exception name="IOException" type="java.io.IOException"/>
  27504. <doc>
  27505. <![CDATA[copies the file in the har filesystem to a local file.]]>
  27506. </doc>
  27507. </method>
  27508. <method name="startLocalOutput" return="org.apache.hadoop.fs.Path"
  27509. abstract="false" native="false" synchronized="false"
  27510. static="false" final="false" visibility="public"
  27511. deprecated="not deprecated">
  27512. <param name="fsOutputFile" type="org.apache.hadoop.fs.Path"/>
  27513. <param name="tmpLocalFile" type="org.apache.hadoop.fs.Path"/>
  27514. <exception name="IOException" type="java.io.IOException"/>
  27515. <doc>
  27516. <![CDATA[not implemented.]]>
  27517. </doc>
  27518. </method>
  27519. <method name="completeLocalOutput"
  27520. abstract="false" native="false" synchronized="false"
  27521. static="false" final="false" visibility="public"
  27522. deprecated="not deprecated">
  27523. <param name="fsOutputFile" type="org.apache.hadoop.fs.Path"/>
  27524. <param name="tmpLocalFile" type="org.apache.hadoop.fs.Path"/>
  27525. <exception name="IOException" type="java.io.IOException"/>
  27526. <doc>
  27527. <![CDATA[not implemented.]]>
  27528. </doc>
  27529. </method>
  27530. <method name="setOwner"
  27531. abstract="false" native="false" synchronized="false"
  27532. static="false" final="false" visibility="public"
  27533. deprecated="not deprecated">
  27534. <param name="p" type="org.apache.hadoop.fs.Path"/>
  27535. <param name="username" type="java.lang.String"/>
  27536. <param name="groupname" type="java.lang.String"/>
  27537. <exception name="IOException" type="java.io.IOException"/>
  27538. <doc>
  27539. <![CDATA[not implemented.]]>
  27540. </doc>
  27541. </method>
  27542. <method name="setPermission"
  27543. abstract="false" native="false" synchronized="false"
  27544. static="false" final="false" visibility="public"
  27545. deprecated="not deprecated">
  27546. <param name="p" type="org.apache.hadoop.fs.Path"/>
  27547. <param name="permisssion" type="org.apache.hadoop.fs.permission.FsPermission"/>
  27548. <exception name="IOException" type="java.io.IOException"/>
  27549. <doc>
  27550. <![CDATA[Not implemented.]]>
  27551. </doc>
  27552. </method>
  27553. <field name="VERSION" type="int"
  27554. transient="false" volatile="false"
  27555. static="true" final="true" visibility="public"
  27556. deprecated="not deprecated">
  27557. </field>
  27558. <doc>
  27559. <![CDATA[This is an implementation of the Hadoop Archive
  27560. Filesystem. This archive Filesystem has index files
  27561. of the form _index* and has contents of the form
  27562. part-*. The index files store the indexes of the
  27563. real files. The index files are of the form _masterindex
  27564. and _index. The master index is a level of indirection
  27565. in to the index file to make the look ups faster. the index
  27566. file is sorted with hash code of the paths that it contains
  27567. and the master index contains pointers to the positions in
  27568. index for ranges of hashcodes.]]>
  27569. </doc>
  27570. </class>
  27571. <!-- end class org.apache.hadoop.fs.HarFileSystem -->
  27572. </package>
  27573. <package name="org.apache.hadoop.tools">
  27574. <!-- start class org.apache.hadoop.tools.DistCh -->
  27575. <class name="DistCh" extends="org.apache.hadoop.tools.DistTool"
  27576. abstract="false"
  27577. static="false" final="false" visibility="public"
  27578. deprecated="not deprecated">
  27579. <method name="run" return="int"
  27580. abstract="false" native="false" synchronized="false"
  27581. static="false" final="false" visibility="public"
  27582. deprecated="not deprecated">
  27583. <param name="args" type="java.lang.String[]"/>
  27584. <exception name="Exception" type="java.lang.Exception"/>
  27585. <doc>
  27586. <![CDATA[This is the main driver for recursively changing files properties.]]>
  27587. </doc>
  27588. </method>
  27589. <method name="main"
  27590. abstract="false" native="false" synchronized="false"
  27591. static="true" final="false" visibility="public"
  27592. deprecated="not deprecated">
  27593. <param name="args" type="java.lang.String[]"/>
  27594. <exception name="Exception" type="java.lang.Exception"/>
  27595. </method>
  27596. <doc>
  27597. <![CDATA[A Map-reduce program to recursively change files properties
  27598. such as owner, group and permission.]]>
  27599. </doc>
  27600. </class>
  27601. <!-- end class org.apache.hadoop.tools.DistCh -->
  27602. <!-- start class org.apache.hadoop.tools.DistCp -->
  27603. <class name="DistCp" extends="java.lang.Object"
  27604. abstract="false"
  27605. static="false" final="false" visibility="public"
  27606. deprecated="not deprecated">
  27607. <implements name="org.apache.hadoop.util.Tool"/>
  27608. <constructor name="DistCp" type="org.apache.hadoop.conf.Configuration"
  27609. static="false" final="false" visibility="public"
  27610. deprecated="not deprecated">
  27611. </constructor>
  27612. <method name="setConf"
  27613. abstract="false" native="false" synchronized="false"
  27614. static="false" final="false" visibility="public"
  27615. deprecated="not deprecated">
  27616. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  27617. </method>
  27618. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  27619. abstract="false" native="false" synchronized="false"
  27620. static="false" final="false" visibility="public"
  27621. deprecated="not deprecated">
  27622. </method>
  27623. <method name="copy"
  27624. abstract="false" native="false" synchronized="false"
  27625. static="true" final="false" visibility="public"
  27626. deprecated="not deprecated">
  27627. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  27628. <param name="srcPath" type="java.lang.String"/>
  27629. <param name="destPath" type="java.lang.String"/>
  27630. <param name="logPath" type="org.apache.hadoop.fs.Path"/>
  27631. <param name="srcAsList" type="boolean"/>
  27632. <param name="ignoreReadFailures" type="boolean"/>
  27633. <exception name="IOException" type="java.io.IOException"/>
  27634. </method>
  27635. <method name="run" return="int"
  27636. abstract="false" native="false" synchronized="false"
  27637. static="false" final="false" visibility="public"
  27638. deprecated="not deprecated">
  27639. <param name="args" type="java.lang.String[]"/>
  27640. <doc>
  27641. <![CDATA[This is the main driver for recursively copying directories
  27642. across file systems. It takes at least two cmdline parameters. A source
  27643. URL and a destination URL. It then essentially does an "ls -lR" on the
  27644. source URL, and writes the output in a round-robin manner to all the map
  27645. input files. The mapper actually copies the files allotted to it. The
  27646. reduce is empty.]]>
  27647. </doc>
  27648. </method>
  27649. <method name="main"
  27650. abstract="false" native="false" synchronized="false"
  27651. static="true" final="false" visibility="public"
  27652. deprecated="not deprecated">
  27653. <param name="args" type="java.lang.String[]"/>
  27654. <exception name="Exception" type="java.lang.Exception"/>
  27655. </method>
  27656. <method name="getRandomId" return="java.lang.String"
  27657. abstract="false" native="false" synchronized="false"
  27658. static="true" final="false" visibility="public"
  27659. deprecated="not deprecated">
  27660. </method>
  27661. <field name="LOG" type="org.apache.commons.logging.Log"
  27662. transient="false" volatile="false"
  27663. static="true" final="true" visibility="public"
  27664. deprecated="not deprecated">
  27665. </field>
  27666. <doc>
  27667. <![CDATA[A Map-reduce program to recursively copy directories between
  27668. different file-systems.]]>
  27669. </doc>
  27670. </class>
  27671. <!-- end class org.apache.hadoop.tools.DistCp -->
  27672. <!-- start class org.apache.hadoop.tools.DistCp.DuplicationException -->
  27673. <class name="DistCp.DuplicationException" extends="java.io.IOException"
  27674. abstract="false"
  27675. static="true" final="false" visibility="public"
  27676. deprecated="not deprecated">
  27677. <field name="ERROR_CODE" type="int"
  27678. transient="false" volatile="false"
  27679. static="true" final="true" visibility="public"
  27680. deprecated="not deprecated">
  27681. <doc>
  27682. <![CDATA[Error code for this exception]]>
  27683. </doc>
  27684. </field>
  27685. <doc>
  27686. <![CDATA[An exception class for duplicated source files.]]>
  27687. </doc>
  27688. </class>
  27689. <!-- end class org.apache.hadoop.tools.DistCp.DuplicationException -->
  27690. <!-- start class org.apache.hadoop.tools.HadoopArchives -->
  27691. <class name="HadoopArchives" extends="java.lang.Object"
  27692. abstract="false"
  27693. static="false" final="false" visibility="public"
  27694. deprecated="not deprecated">
  27695. <implements name="org.apache.hadoop.util.Tool"/>
  27696. <constructor name="HadoopArchives" type="org.apache.hadoop.conf.Configuration"
  27697. static="false" final="false" visibility="public"
  27698. deprecated="not deprecated">
  27699. </constructor>
  27700. <method name="setConf"
  27701. abstract="false" native="false" synchronized="false"
  27702. static="false" final="false" visibility="public"
  27703. deprecated="not deprecated">
  27704. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  27705. </method>
  27706. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  27707. abstract="false" native="false" synchronized="false"
  27708. static="false" final="false" visibility="public"
  27709. deprecated="not deprecated">
  27710. </method>
  27711. <method name="run" return="int"
  27712. abstract="false" native="false" synchronized="false"
  27713. static="false" final="false" visibility="public"
  27714. deprecated="not deprecated">
  27715. <param name="args" type="java.lang.String[]"/>
  27716. <exception name="Exception" type="java.lang.Exception"/>
  27717. <doc>
  27718. <![CDATA[the main driver for creating the archives
  27719. it takes at least three command line parameters. The parent path,
  27720. The src and the dest. It does an lsr on the source paths.
  27721. The mapper creates archives and the reducer creates
  27722. the archive index.]]>
  27723. </doc>
  27724. </method>
  27725. <method name="main"
  27726. abstract="false" native="false" synchronized="false"
  27727. static="true" final="false" visibility="public"
  27728. deprecated="not deprecated">
  27729. <param name="args" type="java.lang.String[]"/>
  27730. <doc>
  27731. <![CDATA[the main functions]]>
  27732. </doc>
  27733. </method>
  27734. <field name="VERSION" type="int"
  27735. transient="false" volatile="false"
  27736. static="true" final="true" visibility="public"
  27737. deprecated="not deprecated">
  27738. </field>
  27739. <doc>
  27740. <![CDATA[an archive creation utility.
  27741. This class provides methods that can be used
  27742. to create hadoop archives. For understanding of
  27743. Hadoop archives look at {@link HarFileSystem}.]]>
  27744. </doc>
  27745. </class>
  27746. <!-- end class org.apache.hadoop.tools.HadoopArchives -->
  27747. <!-- start class org.apache.hadoop.tools.Logalyzer -->
  27748. <class name="Logalyzer" extends="java.lang.Object"
  27749. abstract="false"
  27750. static="false" final="false" visibility="public"
  27751. deprecated="not deprecated">
  27752. <constructor name="Logalyzer"
  27753. static="false" final="false" visibility="public"
  27754. deprecated="not deprecated">
  27755. </constructor>
  27756. <method name="doArchive"
  27757. abstract="false" native="false" synchronized="false"
  27758. static="false" final="false" visibility="public"
  27759. deprecated="not deprecated">
  27760. <param name="logListURI" type="java.lang.String"/>
  27761. <param name="archiveDirectory" type="java.lang.String"/>
  27762. <exception name="IOException" type="java.io.IOException"/>
  27763. <doc>
  27764. <![CDATA[doArchive: Workhorse function to archive log-files.
  27765. @param logListURI : The uri which will serve list of log-files to archive.
  27766. @param archiveDirectory : The directory to store archived logfiles.
  27767. @throws IOException]]>
  27768. </doc>
  27769. </method>
  27770. <method name="doAnalyze"
  27771. abstract="false" native="false" synchronized="false"
  27772. static="false" final="false" visibility="public"
  27773. deprecated="not deprecated">
  27774. <param name="inputFilesDirectory" type="java.lang.String"/>
  27775. <param name="outputDirectory" type="java.lang.String"/>
  27776. <param name="grepPattern" type="java.lang.String"/>
  27777. <param name="sortColumns" type="java.lang.String"/>
  27778. <param name="columnSeparator" type="java.lang.String"/>
  27779. <exception name="IOException" type="java.io.IOException"/>
  27780. <doc>
  27781. <![CDATA[doAnalyze:
  27782. @param inputFilesDirectory : Directory containing the files to be analyzed.
  27783. @param outputDirectory : Directory to store analysis (output).
  27784. @param grepPattern : Pattern to *grep* for.
  27785. @param sortColumns : Sort specification for output.
  27786. @param columnSeparator : Column separator.
  27787. @throws IOException]]>
  27788. </doc>
  27789. </method>
  27790. <method name="main"
  27791. abstract="false" native="false" synchronized="false"
  27792. static="true" final="false" visibility="public"
  27793. deprecated="not deprecated">
  27794. <param name="args" type="java.lang.String[]"/>
  27795. </method>
  27796. <field name="SORT_COLUMNS" type="java.lang.String"
  27797. transient="false" volatile="false"
  27798. static="true" final="false" visibility="public"
  27799. deprecated="not deprecated">
  27800. </field>
  27801. <field name="COLUMN_SEPARATOR" type="java.lang.String"
  27802. transient="false" volatile="false"
  27803. static="true" final="false" visibility="public"
  27804. deprecated="not deprecated">
  27805. </field>
  27806. <doc>
  27807. <![CDATA[Logalyzer: A utility tool for archiving and analyzing hadoop logs.
  27808. <p>
  27809. This tool supports archiving and analyzing (sort/grep) of log-files.
  27810. It takes as input
  27811. a) Input uri which will serve uris of the logs to be archived.
  27812. b) Output directory (not mandatory).
  27813. c) Directory on dfs to archive the logs.
  27814. d) The sort/grep patterns for analyzing the files and separator for boundaries.
  27815. Usage:
  27816. Logalyzer -archive -archiveDir <directory to archive logs> -analysis <directory> -logs <log-list uri> -grep <pattern> -sort <col1, col2> -separator <separator>
  27817. <p>]]>
  27818. </doc>
  27819. </class>
  27820. <!-- end class org.apache.hadoop.tools.Logalyzer -->
  27821. <!-- start class org.apache.hadoop.tools.Logalyzer.LogComparator -->
  27822. <class name="Logalyzer.LogComparator" extends="org.apache.hadoop.io.Text.Comparator"
  27823. abstract="false"
  27824. static="true" final="false" visibility="public"
  27825. deprecated="not deprecated">
  27826. <implements name="org.apache.hadoop.conf.Configurable"/>
  27827. <constructor name="Logalyzer.LogComparator"
  27828. static="false" final="false" visibility="public"
  27829. deprecated="not deprecated">
  27830. </constructor>
  27831. <method name="setConf"
  27832. abstract="false" native="false" synchronized="false"
  27833. static="false" final="false" visibility="public"
  27834. deprecated="not deprecated">
  27835. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  27836. </method>
  27837. <method name="getConf" return="org.apache.hadoop.conf.Configuration"
  27838. abstract="false" native="false" synchronized="false"
  27839. static="false" final="false" visibility="public"
  27840. deprecated="not deprecated">
  27841. </method>
  27842. <method name="compare" return="int"
  27843. abstract="false" native="false" synchronized="false"
  27844. static="false" final="false" visibility="public"
  27845. deprecated="not deprecated">
  27846. <param name="b1" type="byte[]"/>
  27847. <param name="s1" type="int"/>
  27848. <param name="l1" type="int"/>
  27849. <param name="b2" type="byte[]"/>
  27850. <param name="s2" type="int"/>
  27851. <param name="l2" type="int"/>
  27852. </method>
  27853. <doc>
  27854. <![CDATA[A WritableComparator optimized for UTF8 keys of the logs.]]>
  27855. </doc>
  27856. </class>
  27857. <!-- end class org.apache.hadoop.tools.Logalyzer.LogComparator -->
  27858. <!-- start class org.apache.hadoop.tools.Logalyzer.LogRegexMapper -->
  27859. <class name="Logalyzer.LogRegexMapper" extends="org.apache.hadoop.mapred.MapReduceBase"
  27860. abstract="false"
  27861. static="true" final="false" visibility="public"
  27862. deprecated="not deprecated">
  27863. <implements name="org.apache.hadoop.mapred.Mapper"/>
  27864. <constructor name="Logalyzer.LogRegexMapper"
  27865. static="false" final="false" visibility="public"
  27866. deprecated="not deprecated">
  27867. </constructor>
  27868. <method name="configure"
  27869. abstract="false" native="false" synchronized="false"
  27870. static="false" final="false" visibility="public"
  27871. deprecated="not deprecated">
  27872. <param name="job" type="org.apache.hadoop.mapred.JobConf"/>
  27873. </method>
  27874. <method name="map"
  27875. abstract="false" native="false" synchronized="false"
  27876. static="false" final="false" visibility="public"
  27877. deprecated="not deprecated">
  27878. <param name="key" type="K"/>
  27879. <param name="value" type="org.apache.hadoop.io.Text"/>
  27880. <param name="output" type="org.apache.hadoop.mapred.OutputCollector"/>
  27881. <param name="reporter" type="org.apache.hadoop.mapred.Reporter"/>
  27882. <exception name="IOException" type="java.io.IOException"/>
  27883. </method>
  27884. <doc>
  27885. <![CDATA[A {@link Mapper} that extracts text matching a regular expression.]]>
  27886. </doc>
  27887. </class>
  27888. <!-- end class org.apache.hadoop.tools.Logalyzer.LogRegexMapper -->
  27889. </package>
  27890. <package name="org.apache.hadoop.tools.rumen">
  27891. <!-- start class org.apache.hadoop.tools.rumen.AbstractClusterStory -->
  27892. <class name="AbstractClusterStory" extends="java.lang.Object"
  27893. abstract="true"
  27894. static="false" final="false" visibility="public"
  27895. deprecated="not deprecated">
  27896. <implements name="org.apache.hadoop.tools.rumen.ClusterStory"/>
  27897. <constructor name="AbstractClusterStory"
  27898. static="false" final="false" visibility="public"
  27899. deprecated="not deprecated">
  27900. </constructor>
  27901. <method name="getMachines" return="java.util.Set"
  27902. abstract="false" native="false" synchronized="false"
  27903. static="false" final="false" visibility="public"
  27904. deprecated="not deprecated">
  27905. </method>
  27906. <method name="getRacks" return="java.util.Set"
  27907. abstract="false" native="false" synchronized="true"
  27908. static="false" final="false" visibility="public"
  27909. deprecated="not deprecated">
  27910. </method>
  27911. <method name="getRandomMachines" return="org.apache.hadoop.tools.rumen.MachineNode[]"
  27912. abstract="false" native="false" synchronized="true"
  27913. static="false" final="false" visibility="public"
  27914. deprecated="not deprecated">
  27915. <param name="expected" type="int"/>
  27916. <param name="random" type="java.util.Random"/>
  27917. </method>
  27918. <method name="buildMachineNodeMap"
  27919. abstract="false" native="false" synchronized="true"
  27920. static="false" final="false" visibility="protected"
  27921. deprecated="not deprecated">
  27922. </method>
  27923. <method name="getMachineByName" return="org.apache.hadoop.tools.rumen.MachineNode"
  27924. abstract="false" native="false" synchronized="false"
  27925. static="false" final="false" visibility="public"
  27926. deprecated="not deprecated">
  27927. <param name="name" type="java.lang.String"/>
  27928. </method>
  27929. <method name="distance" return="int"
  27930. abstract="false" native="false" synchronized="false"
  27931. static="false" final="false" visibility="public"
  27932. deprecated="not deprecated">
  27933. <param name="a" type="org.apache.hadoop.tools.rumen.Node"/>
  27934. <param name="b" type="org.apache.hadoop.tools.rumen.Node"/>
  27935. </method>
  27936. <method name="buildRackNodeMap"
  27937. abstract="false" native="false" synchronized="true"
  27938. static="false" final="false" visibility="protected"
  27939. deprecated="not deprecated">
  27940. </method>
  27941. <method name="getRackByName" return="org.apache.hadoop.tools.rumen.RackNode"
  27942. abstract="false" native="false" synchronized="false"
  27943. static="false" final="false" visibility="public"
  27944. deprecated="not deprecated">
  27945. <param name="name" type="java.lang.String"/>
  27946. </method>
  27947. <method name="getMaximumDistance" return="int"
  27948. abstract="false" native="false" synchronized="false"
  27949. static="false" final="false" visibility="public"
  27950. deprecated="not deprecated">
  27951. </method>
  27952. <method name="parseTopologyTree"
  27953. abstract="false" native="false" synchronized="true"
  27954. static="false" final="false" visibility="protected"
  27955. deprecated="not deprecated">
  27956. </method>
  27957. <field name="machineNodes" type="java.util.Set"
  27958. transient="false" volatile="false"
  27959. static="false" final="false" visibility="protected"
  27960. deprecated="not deprecated">
  27961. </field>
  27962. <field name="rackNodes" type="java.util.Set"
  27963. transient="false" volatile="false"
  27964. static="false" final="false" visibility="protected"
  27965. deprecated="not deprecated">
  27966. </field>
  27967. <field name="mNodesFlattened" type="org.apache.hadoop.tools.rumen.MachineNode[]"
  27968. transient="false" volatile="false"
  27969. static="false" final="false" visibility="protected"
  27970. deprecated="not deprecated">
  27971. </field>
  27972. <field name="mNodeMap" type="java.util.Map"
  27973. transient="false" volatile="false"
  27974. static="false" final="false" visibility="protected"
  27975. deprecated="not deprecated">
  27976. </field>
  27977. <field name="rNodeMap" type="java.util.Map"
  27978. transient="false" volatile="false"
  27979. static="false" final="false" visibility="protected"
  27980. deprecated="not deprecated">
  27981. </field>
  27982. <field name="maximumDistance" type="int"
  27983. transient="false" volatile="false"
  27984. static="false" final="false" visibility="protected"
  27985. deprecated="not deprecated">
  27986. </field>
  27987. <doc>
  27988. <![CDATA[{@link AbstractClusterStory} provides a partial implementation of
  27989. {@link ClusterStory} by parsing the topology tree.]]>
  27990. </doc>
  27991. </class>
  27992. <!-- end class org.apache.hadoop.tools.rumen.AbstractClusterStory -->
  27993. <!-- start class org.apache.hadoop.tools.rumen.CDFPiecewiseLinearRandomGenerator -->
  27994. <class name="CDFPiecewiseLinearRandomGenerator" extends="org.apache.hadoop.tools.rumen.CDFRandomGenerator"
  27995. abstract="false"
  27996. static="false" final="false" visibility="public"
  27997. deprecated="not deprecated">
  27998. <constructor name="CDFPiecewiseLinearRandomGenerator" type="org.apache.hadoop.tools.rumen.LoggedDiscreteCDF"
  27999. static="false" final="false" visibility="public"
  28000. deprecated="not deprecated">
  28001. <doc>
  28002. <![CDATA[@param cdf
  28003. builds a CDFRandomValue engine around this
  28004. {@link LoggedDiscreteCDF}, with a defaultly seeded RNG]]>
  28005. </doc>
  28006. </constructor>
  28007. <constructor name="CDFPiecewiseLinearRandomGenerator" type="org.apache.hadoop.tools.rumen.LoggedDiscreteCDF, long"
  28008. static="false" final="false" visibility="public"
  28009. deprecated="not deprecated">
  28010. <doc>
  28011. <![CDATA[@param cdf
  28012. builds a CDFRandomValue engine around this
  28013. {@link LoggedDiscreteCDF}, with an explicitly seeded RNG
  28014. @param seed
  28015. the random number generator seed]]>
  28016. </doc>
  28017. </constructor>
  28018. <method name="valueAt" return="long"
  28019. abstract="false" native="false" synchronized="false"
  28020. static="false" final="false" visibility="public"
  28021. deprecated="not deprecated">
  28022. <param name="probability" type="double"/>
  28023. <doc>
  28024. <![CDATA[TODO This code assumes that the empirical minimum resp. maximum is the
  28025. epistemological minimum resp. maximum. This is probably okay for the
  28026. minimum, because that likely represents a task where everything went well,
  28027. but for the maximum we may want to develop a way of extrapolating past the
  28028. maximum.]]>
  28029. </doc>
  28030. </method>
  28031. </class>
  28032. <!-- end class org.apache.hadoop.tools.rumen.CDFPiecewiseLinearRandomGenerator -->
  28033. <!-- start class org.apache.hadoop.tools.rumen.CDFRandomGenerator -->
  28034. <class name="CDFRandomGenerator" extends="java.lang.Object"
  28035. abstract="true"
  28036. static="false" final="false" visibility="public"
  28037. deprecated="not deprecated">
  28038. <method name="initializeTables"
  28039. abstract="false" native="false" synchronized="false"
  28040. static="false" final="true" visibility="protected"
  28041. deprecated="not deprecated">
  28042. <param name="cdf" type="org.apache.hadoop.tools.rumen.LoggedDiscreteCDF"/>
  28043. </method>
  28044. <method name="floorIndex" return="int"
  28045. abstract="false" native="false" synchronized="false"
  28046. static="false" final="false" visibility="protected"
  28047. deprecated="not deprecated">
  28048. <param name="probe" type="double"/>
  28049. </method>
  28050. <method name="getRankingAt" return="double"
  28051. abstract="false" native="false" synchronized="false"
  28052. static="false" final="false" visibility="protected"
  28053. deprecated="not deprecated">
  28054. <param name="index" type="int"/>
  28055. </method>
  28056. <method name="getDatumAt" return="long"
  28057. abstract="false" native="false" synchronized="false"
  28058. static="false" final="false" visibility="protected"
  28059. deprecated="not deprecated">
  28060. <param name="index" type="int"/>
  28061. </method>
  28062. <method name="randomValue" return="long"
  28063. abstract="false" native="false" synchronized="false"
  28064. static="false" final="false" visibility="public"
  28065. deprecated="not deprecated">
  28066. </method>
  28067. <method name="valueAt" return="long"
  28068. abstract="true" native="false" synchronized="false"
  28069. static="false" final="false" visibility="public"
  28070. deprecated="not deprecated">
  28071. <param name="probability" type="double"/>
  28072. </method>
  28073. <doc>
  28074. <![CDATA[An instance of this class generates random values that conform to the
  28075. embedded {@link LoggedDiscreteCDF} . The discrete CDF is a pointwise
  28076. approximation of the "real" CDF. We therefore have a choice of interpolation
  28077. rules.
  28078. A concrete subclass of this abstract class will implement valueAt(double)
  28079. using a class-dependent interpolation rule.]]>
  28080. </doc>
  28081. </class>
  28082. <!-- end class org.apache.hadoop.tools.rumen.CDFRandomGenerator -->
  28083. <!-- start interface org.apache.hadoop.tools.rumen.ClusterStory -->
  28084. <interface name="ClusterStory" abstract="true"
  28085. static="false" final="false" visibility="public"
  28086. deprecated="not deprecated">
  28087. <method name="getMachines" return="java.util.Set"
  28088. abstract="false" native="false" synchronized="false"
  28089. static="false" final="false" visibility="public"
  28090. deprecated="not deprecated">
  28091. <doc>
  28092. <![CDATA[Get all machines of the cluster.
  28093. @return A read-only set that contains all machines of the cluster.]]>
  28094. </doc>
  28095. </method>
  28096. <method name="getRacks" return="java.util.Set"
  28097. abstract="false" native="false" synchronized="false"
  28098. static="false" final="false" visibility="public"
  28099. deprecated="not deprecated">
  28100. <doc>
  28101. <![CDATA[Get all racks of the cluster.
  28102. @return A read-only set that contains all racks of the cluster.]]>
  28103. </doc>
  28104. </method>
  28105. <method name="getClusterTopology" return="org.apache.hadoop.tools.rumen.Node"
  28106. abstract="false" native="false" synchronized="false"
  28107. static="false" final="false" visibility="public"
  28108. deprecated="not deprecated">
  28109. <doc>
  28110. <![CDATA[Get the cluster topology tree.
  28111. @return The root node of the cluster topology tree.]]>
  28112. </doc>
  28113. </method>
  28114. <method name="getRandomMachines" return="org.apache.hadoop.tools.rumen.MachineNode[]"
  28115. abstract="false" native="false" synchronized="false"
  28116. static="false" final="false" visibility="public"
  28117. deprecated="not deprecated">
  28118. <param name="expected" type="int"/>
  28119. <param name="random" type="java.util.Random"/>
  28120. <doc>
  28121. <![CDATA[Select a random set of machines.
  28122. @param expected The expected sample size.
  28123. @param random Random number generator to use.
  28124. @return An array of up to expected number of {@link MachineNode}s.]]>
  28125. </doc>
  28126. </method>
  28127. <method name="getMachineByName" return="org.apache.hadoop.tools.rumen.MachineNode"
  28128. abstract="false" native="false" synchronized="false"
  28129. static="false" final="false" visibility="public"
  28130. deprecated="not deprecated">
  28131. <param name="name" type="java.lang.String"/>
  28132. <doc>
  28133. <![CDATA[Get {@link MachineNode} by its host name.
  28134. @return The {@link MachineNode} with the same name. Or null if not found.]]>
  28135. </doc>
  28136. </method>
  28137. <method name="getRackByName" return="org.apache.hadoop.tools.rumen.RackNode"
  28138. abstract="false" native="false" synchronized="false"
  28139. static="false" final="false" visibility="public"
  28140. deprecated="not deprecated">
  28141. <param name="name" type="java.lang.String"/>
  28142. <doc>
  28143. <![CDATA[Get {@link RackNode} by its name.
  28144. @return The {@link RackNode} with the same name. Or null if not found.]]>
  28145. </doc>
  28146. </method>
  28147. <method name="distance" return="int"
  28148. abstract="false" native="false" synchronized="false"
  28149. static="false" final="false" visibility="public"
  28150. deprecated="not deprecated">
  28151. <param name="a" type="org.apache.hadoop.tools.rumen.Node"/>
  28152. <param name="b" type="org.apache.hadoop.tools.rumen.Node"/>
  28153. <doc>
  28154. <![CDATA[Determine the distance between two {@link Node}s. Currently, the distance
  28155. is loosely defined as the length of the longer path for either a or b to
  28156. reach their common ancestor.
  28157. @param a
  28158. @param b
  28159. @return The distance between {@link Node} a and {@link Node} b.]]>
  28160. </doc>
  28161. </method>
  28162. <method name="getMaximumDistance" return="int"
  28163. abstract="false" native="false" synchronized="false"
  28164. static="false" final="false" visibility="public"
  28165. deprecated="not deprecated">
  28166. <doc>
  28167. <![CDATA[Get the maximum distance possible between any two nodes.
  28168. @return the maximum distance possible between any two nodes.]]>
  28169. </doc>
  28170. </method>
  28171. <doc>
  28172. <![CDATA[{@link ClusterStory} represents all configurations of a MapReduce cluster,
  28173. including nodes, network topology, and slot configurations.]]>
  28174. </doc>
  28175. </interface>
  28176. <!-- end interface org.apache.hadoop.tools.rumen.ClusterStory -->
  28177. <!-- start class org.apache.hadoop.tools.rumen.ClusterTopologyReader -->
  28178. <class name="ClusterTopologyReader" extends="java.lang.Object"
  28179. abstract="false"
  28180. static="false" final="false" visibility="public"
  28181. deprecated="not deprecated">
  28182. <constructor name="ClusterTopologyReader" type="org.apache.hadoop.fs.Path, org.apache.hadoop.conf.Configuration"
  28183. static="false" final="false" visibility="public"
  28184. deprecated="not deprecated">
  28185. <exception name="IOException" type="java.io.IOException"/>
  28186. <doc>
  28187. <![CDATA[Constructor.
  28188. @param path
  28189. Path to the JSON-encoded topology file, possibly compressed.
  28190. @param conf
  28191. @throws IOException]]>
  28192. </doc>
  28193. </constructor>
  28194. <constructor name="ClusterTopologyReader" type="java.io.InputStream"
  28195. static="false" final="false" visibility="public"
  28196. deprecated="not deprecated">
  28197. <exception name="IOException" type="java.io.IOException"/>
  28198. <doc>
  28199. <![CDATA[Constructor.
  28200. @param input
  28201. The input stream for the JSON-encoded topology data.]]>
  28202. </doc>
  28203. </constructor>
  28204. <method name="get" return="org.apache.hadoop.tools.rumen.LoggedNetworkTopology"
  28205. abstract="false" native="false" synchronized="false"
  28206. static="false" final="false" visibility="public"
  28207. deprecated="not deprecated">
  28208. <doc>
  28209. <![CDATA[Get the {@link LoggedNetworkTopology} object.
  28210. @return The {@link LoggedNetworkTopology} object parsed from the input.]]>
  28211. </doc>
  28212. </method>
  28213. <doc>
  28214. <![CDATA[Reads JSON-encoded cluster topology and produces the parsed
  28215. {@link LoggedNetworkTopology} object.]]>
  28216. </doc>
  28217. </class>
  28218. <!-- end class org.apache.hadoop.tools.rumen.ClusterTopologyReader -->
  28219. <!-- start class org.apache.hadoop.tools.rumen.CurrentJHParser -->
  28220. <class name="CurrentJHParser" extends="java.lang.Object"
  28221. abstract="false"
  28222. static="false" final="false" visibility="public"
  28223. deprecated="not deprecated">
  28224. <implements name="org.apache.hadoop.tools.rumen.JobHistoryParser"/>
  28225. <constructor name="CurrentJHParser" type="java.io.InputStream"
  28226. static="false" final="false" visibility="public"
  28227. deprecated="not deprecated">
  28228. <exception name="IOException" type="java.io.IOException"/>
  28229. </constructor>
  28230. <method name="canParse" return="boolean"
  28231. abstract="false" native="false" synchronized="false"
  28232. static="true" final="false" visibility="public"
  28233. deprecated="not deprecated">
  28234. <param name="input" type="java.io.InputStream"/>
  28235. <exception name="IOException" type="java.io.IOException"/>
  28236. <doc>
  28237. <![CDATA[Can this parser parse the input?
  28238. @param input
  28239. @return Whether this parser can parse the input.
  28240. @throws IOException]]>
  28241. </doc>
  28242. </method>
  28243. <method name="nextEvent" return="org.apache.hadoop.mapreduce.jobhistory.HistoryEvent"
  28244. abstract="false" native="false" synchronized="false"
  28245. static="false" final="false" visibility="public"
  28246. deprecated="not deprecated">
  28247. <exception name="IOException" type="java.io.IOException"/>
  28248. </method>
  28249. <method name="close"
  28250. abstract="false" native="false" synchronized="false"
  28251. static="false" final="false" visibility="public"
  28252. deprecated="not deprecated">
  28253. <exception name="IOException" type="java.io.IOException"/>
  28254. </method>
  28255. <doc>
  28256. <![CDATA[{@link JobHistoryParser} that parses {@link JobHistory} files produced by
  28257. {@link org.apache.hadoop.mapreduce.jobhistory.JobHistory} in the same source
  28258. code tree as rumen.]]>
  28259. </doc>
  28260. </class>
  28261. <!-- end class org.apache.hadoop.tools.rumen.CurrentJHParser -->
  28262. <!-- start interface org.apache.hadoop.tools.rumen.DeepCompare -->
  28263. <interface name="DeepCompare" abstract="true"
  28264. static="false" final="false" visibility="public"
  28265. deprecated="not deprecated">
  28266. <method name="deepCompare"
  28267. abstract="false" native="false" synchronized="false"
  28268. static="false" final="false" visibility="public"
  28269. deprecated="not deprecated">
  28270. <param name="other" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  28271. <param name="myLocation" type="org.apache.hadoop.tools.rumen.TreePath"/>
  28272. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  28273. <doc>
  28274. <![CDATA[@param other
  28275. the other comparand that's being compared to me
  28276. @param myLocation
  28277. the path that got to me. In the root, myLocation is null. To
  28278. process the scalar {@code foo} field of the root we will make a
  28279. recursive call with a {@link TreePath} whose {@code fieldName} is
  28280. {@code "foo"} and whose {@code index} is -1 and whose {@code
  28281. parent} is {@code null}. To process the plural {@code bar} field
  28282. of the root we will make a recursive call with a {@link TreePath}
  28283. whose fieldName is {@code "bar"} and whose {@code index} is -1 and
  28284. whose {@code parent} is also {@code null}.
  28285. @throws DeepInequalityException]]>
  28286. </doc>
  28287. </method>
  28288. <doc>
  28289. <![CDATA[Classes that implement this interface can deep-compare [for equality only,
  28290. not order] with another instance. They do a deep compare. If there is any
  28291. semantically significant difference, an implementer throws an exception
  28292. with a chain of causes describing the chain of field references and
  28293. indices that get you to the miscompared point.]]>
  28294. </doc>
  28295. </interface>
  28296. <!-- end interface org.apache.hadoop.tools.rumen.DeepCompare -->
  28297. <!-- start class org.apache.hadoop.tools.rumen.DeepInequalityException -->
  28298. <class name="DeepInequalityException" extends="java.lang.Exception"
  28299. abstract="false"
  28300. static="false" final="false" visibility="public"
  28301. deprecated="not deprecated">
  28302. <constructor name="DeepInequalityException" type="java.lang.String, org.apache.hadoop.tools.rumen.TreePath, java.lang.Throwable"
  28303. static="false" final="false" visibility="public"
  28304. deprecated="not deprecated">
  28305. <doc>
  28306. <![CDATA[@param message
  28307. an exception message
  28308. @param path
  28309. the path that gets from the root to the inequality
  28310. This is the constructor that I intend to have used for this
  28311. exception.]]>
  28312. </doc>
  28313. </constructor>
  28314. <constructor name="DeepInequalityException" type="java.lang.String, org.apache.hadoop.tools.rumen.TreePath"
  28315. static="false" final="false" visibility="public"
  28316. deprecated="not deprecated">
  28317. <doc>
  28318. <![CDATA[@param message
  28319. an exception message
  28320. @param path
  28321. the path that gets from the root to the inequality
  28322. This is the constructor that I intend to have used for this
  28323. exception.]]>
  28324. </doc>
  28325. </constructor>
  28326. <doc>
  28327. <![CDATA[We use this exception class in the unit test, and we do a deep comparison
  28328. when we run the]]>
  28329. </doc>
  28330. </class>
  28331. <!-- end class org.apache.hadoop.tools.rumen.DeepInequalityException -->
  28332. <!-- start class org.apache.hadoop.tools.rumen.DefaultInputDemuxer -->
  28333. <class name="DefaultInputDemuxer" extends="java.lang.Object"
  28334. abstract="false"
  28335. static="false" final="false" visibility="public"
  28336. deprecated="not deprecated">
  28337. <implements name="org.apache.hadoop.tools.rumen.InputDemuxer"/>
  28338. <constructor name="DefaultInputDemuxer"
  28339. static="false" final="false" visibility="public"
  28340. deprecated="not deprecated">
  28341. </constructor>
  28342. <method name="bindTo"
  28343. abstract="false" native="false" synchronized="false"
  28344. static="false" final="false" visibility="public"
  28345. deprecated="not deprecated">
  28346. <param name="path" type="org.apache.hadoop.fs.Path"/>
  28347. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  28348. <exception name="IOException" type="java.io.IOException"/>
  28349. </method>
  28350. <method name="getNext" return="org.apache.hadoop.tools.rumen.Pair"
  28351. abstract="false" native="false" synchronized="false"
  28352. static="false" final="false" visibility="public"
  28353. deprecated="not deprecated">
  28354. <exception name="IOException" type="java.io.IOException"/>
  28355. </method>
  28356. <method name="close"
  28357. abstract="false" native="false" synchronized="false"
  28358. static="false" final="false" visibility="public"
  28359. deprecated="not deprecated">
  28360. <exception name="IOException" type="java.io.IOException"/>
  28361. </method>
  28362. <doc>
  28363. <![CDATA[{@link DefaultInputDemuxer} acts as a pass-through demuxer. It just opens
  28364. each file and returns back the input stream. If the input is compressed, it
  28365. would return a decompression stream.]]>
  28366. </doc>
  28367. </class>
  28368. <!-- end class org.apache.hadoop.tools.rumen.DefaultInputDemuxer -->
  28369. <!-- start class org.apache.hadoop.tools.rumen.DefaultOutputter -->
  28370. <class name="DefaultOutputter" extends="java.lang.Object"
  28371. abstract="false"
  28372. static="false" final="false" visibility="public"
  28373. deprecated="not deprecated">
  28374. <implements name="org.apache.hadoop.tools.rumen.Outputter"/>
  28375. <constructor name="DefaultOutputter"
  28376. static="false" final="false" visibility="public"
  28377. deprecated="not deprecated">
  28378. </constructor>
  28379. <method name="init"
  28380. abstract="false" native="false" synchronized="false"
  28381. static="false" final="false" visibility="public"
  28382. deprecated="not deprecated">
  28383. <param name="path" type="org.apache.hadoop.fs.Path"/>
  28384. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  28385. <exception name="IOException" type="java.io.IOException"/>
  28386. </method>
  28387. <method name="output"
  28388. abstract="false" native="false" synchronized="false"
  28389. static="false" final="false" visibility="public"
  28390. deprecated="not deprecated">
  28391. <param name="object" type="T"/>
  28392. <exception name="IOException" type="java.io.IOException"/>
  28393. </method>
  28394. <method name="close"
  28395. abstract="false" native="false" synchronized="false"
  28396. static="false" final="false" visibility="public"
  28397. deprecated="not deprecated">
  28398. <exception name="IOException" type="java.io.IOException"/>
  28399. </method>
  28400. <doc>
  28401. <![CDATA[The default {@link Outputter} that outputs to a plain file. Compression
  28402. will be applied if the path has the right suffix.]]>
  28403. </doc>
  28404. </class>
  28405. <!-- end class org.apache.hadoop.tools.rumen.DefaultOutputter -->
  28406. <!-- start class org.apache.hadoop.tools.rumen.DeskewedJobTraceReader -->
  28407. <class name="DeskewedJobTraceReader" extends="java.lang.Object"
  28408. abstract="false"
  28409. static="false" final="false" visibility="public"
  28410. deprecated="not deprecated">
  28411. <implements name="java.io.Closeable"/>
  28412. <constructor name="DeskewedJobTraceReader" type="org.apache.hadoop.tools.rumen.JobTraceReader, int, boolean"
  28413. static="false" final="false" visibility="public"
  28414. deprecated="not deprecated">
  28415. <exception name="IOException" type="java.io.IOException"/>
  28416. <doc>
  28417. <![CDATA[Constructor.
  28418. @param reader
  28419. the {@link JobTraceReader} that's being protected
  28420. @param skewBufferLength
  28421. the number of late jobs that can precede a later out-of-order
  28422. earlier job
  28423. @throws IOException]]>
  28424. </doc>
  28425. </constructor>
  28426. <constructor name="DeskewedJobTraceReader" type="org.apache.hadoop.tools.rumen.JobTraceReader"
  28427. static="false" final="false" visibility="public"
  28428. deprecated="not deprecated">
  28429. <exception name="IOException" type="java.io.IOException"/>
  28430. </constructor>
  28431. <method name="close"
  28432. abstract="false" native="false" synchronized="false"
  28433. static="false" final="false" visibility="public"
  28434. deprecated="not deprecated">
  28435. <exception name="IOException" type="java.io.IOException"/>
  28436. </method>
  28437. </class>
  28438. <!-- end class org.apache.hadoop.tools.rumen.DeskewedJobTraceReader -->
  28439. <!-- start class org.apache.hadoop.tools.rumen.Folder -->
  28440. <class name="Folder" extends="org.apache.hadoop.conf.Configured"
  28441. abstract="false"
  28442. static="false" final="false" visibility="public"
  28443. deprecated="not deprecated">
  28444. <implements name="org.apache.hadoop.util.Tool"/>
  28445. <constructor name="Folder"
  28446. static="false" final="false" visibility="public"
  28447. deprecated="not deprecated">
  28448. </constructor>
  28449. <method name="run" return="int"
  28450. abstract="false" native="false" synchronized="false"
  28451. static="false" final="false" visibility="public"
  28452. deprecated="not deprecated">
  28453. <param name="args" type="java.lang.String[]"/>
  28454. <exception name="IOException" type="java.io.IOException"/>
  28455. </method>
  28456. <method name="run" return="int"
  28457. abstract="false" native="false" synchronized="false"
  28458. static="false" final="false" visibility="public"
  28459. deprecated="not deprecated">
  28460. <exception name="IOException" type="java.io.IOException"/>
  28461. </method>
  28462. <method name="main"
  28463. abstract="false" native="false" synchronized="false"
  28464. static="true" final="false" visibility="public"
  28465. deprecated="not deprecated">
  28466. <param name="args" type="java.lang.String[]"/>
  28467. <doc>
  28468. <![CDATA[@param args]]>
  28469. </doc>
  28470. </method>
  28471. </class>
  28472. <!-- end class org.apache.hadoop.tools.rumen.Folder -->
  28473. <!-- start class org.apache.hadoop.tools.rumen.Hadoop20JHParser -->
  28474. <class name="Hadoop20JHParser" extends="java.lang.Object"
  28475. abstract="false"
  28476. static="false" final="false" visibility="public"
  28477. deprecated="not deprecated">
  28478. <implements name="org.apache.hadoop.tools.rumen.JobHistoryParser"/>
  28479. <constructor name="Hadoop20JHParser" type="java.io.InputStream"
  28480. static="false" final="false" visibility="public"
  28481. deprecated="not deprecated">
  28482. <exception name="IOException" type="java.io.IOException"/>
  28483. </constructor>
  28484. <method name="canParse" return="boolean"
  28485. abstract="false" native="false" synchronized="false"
  28486. static="true" final="false" visibility="public"
  28487. deprecated="not deprecated">
  28488. <param name="input" type="java.io.InputStream"/>
  28489. <exception name="IOException" type="java.io.IOException"/>
  28490. <doc>
  28491. <![CDATA[Can this parser parse the input?
  28492. @param input
  28493. @return Whether this parser can parse the input.
  28494. @throws IOException
  28495. We will deem a stream to be a good 0.20 job history stream if the
  28496. first line is exactly "Meta VERSION=\"1\" ."]]>
  28497. </doc>
  28498. </method>
  28499. <method name="nextEvent" return="org.apache.hadoop.mapreduce.jobhistory.HistoryEvent"
  28500. abstract="false" native="false" synchronized="false"
  28501. static="false" final="false" visibility="public"
  28502. deprecated="not deprecated">
  28503. </method>
  28504. <method name="close"
  28505. abstract="false" native="false" synchronized="false"
  28506. static="false" final="false" visibility="public"
  28507. deprecated="not deprecated">
  28508. <exception name="IOException" type="java.io.IOException"/>
  28509. </method>
  28510. <doc>
  28511. <![CDATA[{@link JobHistoryParser} to parse job histories for hadoop 0.20 (META=1).]]>
  28512. </doc>
  28513. </class>
  28514. <!-- end class org.apache.hadoop.tools.rumen.Hadoop20JHParser -->
  28515. <!-- start class org.apache.hadoop.tools.rumen.HadoopLogsAnalyzer -->
  28516. <class name="HadoopLogsAnalyzer" extends="org.apache.hadoop.conf.Configured"
  28517. abstract="false"
  28518. static="false" final="false" visibility="public"
  28519. deprecated="not deprecated">
  28520. <implements name="org.apache.hadoop.util.Tool"/>
  28521. <constructor name="HadoopLogsAnalyzer"
  28522. static="false" final="false" visibility="public"
  28523. deprecated="not deprecated">
  28524. </constructor>
  28525. <method name="run" return="int"
  28526. abstract="false" native="false" synchronized="false"
  28527. static="false" final="false" visibility="public"
  28528. deprecated="not deprecated">
  28529. <param name="args" type="java.lang.String[]"/>
  28530. <exception name="IOException" type="java.io.IOException"/>
  28531. </method>
  28532. <method name="main"
  28533. abstract="false" native="false" synchronized="false"
  28534. static="true" final="false" visibility="public"
  28535. deprecated="not deprecated">
  28536. <param name="args" type="java.lang.String[]"/>
  28537. <doc>
  28538. <![CDATA[@param args
  28539. Last arg is the input file. That file can be a directory, in which
  28540. case you get all the files in sorted order. We will decompress
  28541. files whose names end in .gz .
  28542. switches: -c collect line types.
  28543. -d debug mode
  28544. -delays print out the delays [interval between job submit time and
  28545. launch time]
  28546. -runtimes print out the job runtimes
  28547. -spreads print out the ratio of 10%ile and 90%ile, of both the
  28548. successful map task attempt run times and the successful
  28549. reduce task attempt run times
  28550. -tasktimes prints out individual task time distributions
  28551. collects all the line types and prints the first example of each
  28552. one]]>
  28553. </doc>
  28554. </method>
  28555. <doc>
  28556. <![CDATA[This is the main class for rumen log mining functionality.
  28557. It reads a directory of job tracker logs, and computes various information
  28558. about it. See {@code usage()}, below.]]>
  28559. </doc>
  28560. </class>
  28561. <!-- end class org.apache.hadoop.tools.rumen.HadoopLogsAnalyzer -->
  28562. <!-- start interface org.apache.hadoop.tools.rumen.InputDemuxer -->
  28563. <interface name="InputDemuxer" abstract="true"
  28564. static="false" final="false" visibility="public"
  28565. deprecated="not deprecated">
  28566. <implements name="java.io.Closeable"/>
  28567. <method name="bindTo"
  28568. abstract="false" native="false" synchronized="false"
  28569. static="false" final="false" visibility="public"
  28570. deprecated="not deprecated">
  28571. <param name="path" type="org.apache.hadoop.fs.Path"/>
  28572. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  28573. <exception name="IOException" type="java.io.IOException"/>
  28574. <doc>
  28575. <![CDATA[Bind the {@link InputDemuxer} to a particular file.
  28576. @param path
  28577. The path to the file it should bind to.
  28578. @param conf
  28579. Configuration
  28580. @throws IOException
  28581. if the file cannot be read. The method has no return value, so
  28582. neither a successful binding nor a wrong file format is signalled
  28583. through a boolean result.]]>
  28584. </doc>
  28585. </method>
  28586. <method name="getNext" return="org.apache.hadoop.tools.rumen.Pair"
  28587. abstract="false" native="false" synchronized="false"
  28588. static="false" final="false" visibility="public"
  28589. deprecated="not deprecated">
  28590. <exception name="IOException" type="java.io.IOException"/>
  28591. <doc>
  28592. <![CDATA[Get the next <name, input> pair. The name should preserve the original job
  28593. history file or job conf file name. The input object should be closed
  28594. before calling getNext() again. The old input object would be invalid after
  28595. calling getNext() again.
  28596. @return the next <name, input> pair.]]>
  28597. </doc>
  28598. </method>
  28599. <doc>
  28600. <![CDATA[{@link InputDemuxer} demultiplexes the input files into individual input
  28601. streams.]]>
  28602. </doc>
  28603. </interface>
  28604. <!-- end interface org.apache.hadoop.tools.rumen.InputDemuxer -->
  28605. <!-- start class org.apache.hadoop.tools.rumen.Job20LineHistoryEventEmitter -->
  28606. <class name="Job20LineHistoryEventEmitter" extends="org.apache.hadoop.tools.rumen.HistoryEventEmitter"
  28607. abstract="false"
  28608. static="false" final="false" visibility="public"
  28609. deprecated="not deprecated">
  28610. </class>
  28611. <!-- end class org.apache.hadoop.tools.rumen.Job20LineHistoryEventEmitter -->
  28612. <!-- start class org.apache.hadoop.tools.rumen.JobBuilder -->
  28613. <class name="JobBuilder" extends="java.lang.Object"
  28614. abstract="false"
  28615. static="false" final="false" visibility="public"
  28616. deprecated="not deprecated">
  28617. <constructor name="JobBuilder" type="java.lang.String"
  28618. static="false" final="false" visibility="public"
  28619. deprecated="not deprecated">
  28620. </constructor>
  28621. <method name="getJobID" return="java.lang.String"
  28622. abstract="false" native="false" synchronized="false"
  28623. static="false" final="false" visibility="public"
  28624. deprecated="not deprecated">
  28625. </method>
  28626. <method name="process"
  28627. abstract="false" native="false" synchronized="false"
  28628. static="false" final="false" visibility="public"
  28629. deprecated="not deprecated">
  28630. <param name="event" type="org.apache.hadoop.mapreduce.jobhistory.HistoryEvent"/>
  28631. <doc>
  28632. <![CDATA[Process one {@link HistoryEvent}
  28633. @param event
  28634. The {@link HistoryEvent} to be processed.]]>
  28635. </doc>
  28636. </method>
  28637. <method name="process"
  28638. abstract="false" native="false" synchronized="false"
  28639. static="false" final="false" visibility="public"
  28640. deprecated="not deprecated">
  28641. <param name="conf" type="java.util.Properties"/>
  28642. <doc>
  28643. <![CDATA[Process a collection of JobConf {@link Properties}. We do not restrict it
  28644. to be called once. It is okay to process a conf before, during or after the
  28645. events.
  28646. @param conf
  28647. The job conf properties to be added.]]>
  28648. </doc>
  28649. </method>
  28650. <method name="build" return="org.apache.hadoop.tools.rumen.LoggedJob"
  28651. abstract="false" native="false" synchronized="false"
  28652. static="false" final="false" visibility="public"
  28653. deprecated="not deprecated">
  28654. <doc>
  28655. <![CDATA[Request the builder to build the final object. Once called, the
  28656. {@link JobBuilder} would accept no more events or job-conf properties.
  28657. @return Parsed {@link LoggedJob} object.]]>
  28658. </doc>
  28659. </method>
  28660. <doc>
  28661. <![CDATA[{@link JobBuilder} builds one job. It processes a sequence of
  28662. {@link HistoryEvent}s.]]>
  28663. </doc>
  28664. </class>
  28665. <!-- end class org.apache.hadoop.tools.rumen.JobBuilder -->
  28666. <!-- start class org.apache.hadoop.tools.rumen.JobConfigurationParser -->
  28667. <class name="JobConfigurationParser" extends="java.lang.Object"
  28668. abstract="false"
  28669. static="false" final="false" visibility="public"
  28670. deprecated="not deprecated">
  28671. <constructor name="JobConfigurationParser" type="java.util.List"
  28672. static="false" final="false" visibility="public"
  28673. deprecated="not deprecated">
  28674. <doc>
  28675. <![CDATA[Constructor
  28676. @param interested
  28677. properties we should extract from the job configuration xml.]]>
  28678. </doc>
  28679. </constructor>
  28680. <doc>
  28681. <![CDATA[{@link JobConfigurationParser} parses the job configuration xml file, and
  28682. extracts various framework specific properties. It parses the file using a
  28683. stream-parser and thus is more memory efficient. [This optimization may be
  28684. postponed for a future release]]]>
  28685. </doc>
  28686. </class>
  28687. <!-- end class org.apache.hadoop.tools.rumen.JobConfigurationParser -->
  28688. <!-- start class org.apache.hadoop.tools.rumen.JobConfPropertyNames -->
  28689. <class name="JobConfPropertyNames" extends="java.lang.Enum"
  28690. abstract="false"
  28691. static="false" final="true" visibility="public"
  28692. deprecated="not deprecated">
  28693. <method name="values" return="org.apache.hadoop.tools.rumen.JobConfPropertyNames[]"
  28694. abstract="false" native="false" synchronized="false"
  28695. static="true" final="false" visibility="public"
  28696. deprecated="not deprecated">
  28697. </method>
  28698. <method name="valueOf" return="org.apache.hadoop.tools.rumen.JobConfPropertyNames"
  28699. abstract="false" native="false" synchronized="false"
  28700. static="true" final="false" visibility="public"
  28701. deprecated="not deprecated">
  28702. <param name="name" type="java.lang.String"/>
  28703. </method>
  28704. <method name="getCandidates" return="java.lang.String[]"
  28705. abstract="false" native="false" synchronized="false"
  28706. static="false" final="false" visibility="public"
  28707. deprecated="not deprecated">
  28708. </method>
  28709. </class>
  28710. <!-- end class org.apache.hadoop.tools.rumen.JobConfPropertyNames -->
  28711. <!-- start interface org.apache.hadoop.tools.rumen.JobHistoryParser -->
  28712. <interface name="JobHistoryParser" abstract="true"
  28713. static="false" final="false" visibility="public"
  28714. deprecated="not deprecated">
  28715. <implements name="java.io.Closeable"/>
  28716. <method name="nextEvent" return="org.apache.hadoop.mapreduce.jobhistory.HistoryEvent"
  28717. abstract="false" native="false" synchronized="false"
  28718. static="false" final="false" visibility="public"
  28719. deprecated="not deprecated">
  28720. <exception name="IOException" type="java.io.IOException"/>
  28721. <doc>
  28722. <![CDATA[Get the next {@link HistoryEvent}
  28723. @return the next {@link HistoryEvent}. If no more events left, return null.
  28724. @throws IOException]]>
  28725. </doc>
  28726. </method>
  28727. <doc>
  28728. <![CDATA[{@link JobHistoryParser} defines the interface of a Job History file parser.]]>
  28729. </doc>
  28730. </interface>
  28731. <!-- end interface org.apache.hadoop.tools.rumen.JobHistoryParser -->
  28732. <!-- start class org.apache.hadoop.tools.rumen.JobHistoryParserFactory -->
  28733. <class name="JobHistoryParserFactory" extends="java.lang.Object"
  28734. abstract="false"
  28735. static="false" final="false" visibility="public"
  28736. deprecated="not deprecated">
  28737. <constructor name="JobHistoryParserFactory"
  28738. static="false" final="false" visibility="public"
  28739. deprecated="not deprecated">
  28740. </constructor>
  28741. <method name="getParser" return="org.apache.hadoop.tools.rumen.JobHistoryParser"
  28742. abstract="false" native="false" synchronized="false"
  28743. static="true" final="false" visibility="public"
  28744. deprecated="not deprecated">
  28745. <param name="ris" type="org.apache.hadoop.tools.rumen.RewindableInputStream"/>
  28746. <exception name="IOException" type="java.io.IOException"/>
  28747. </method>
  28748. <doc>
  28749. <![CDATA[{@link JobHistoryParserFactory} is a singleton class that attempts to
  28750. determine the version of job history and return a proper parser.]]>
  28751. </doc>
  28752. </class>
  28753. <!-- end class org.apache.hadoop.tools.rumen.JobHistoryParserFactory -->
  28754. <!-- start class org.apache.hadoop.tools.rumen.JobHistoryParserFactory.VersionDetector -->
  28755. <class name="JobHistoryParserFactory.VersionDetector" extends="java.lang.Enum"
  28756. abstract="false"
  28757. static="true" final="false" visibility="public"
  28758. deprecated="not deprecated">
  28759. <method name="values" return="org.apache.hadoop.tools.rumen.JobHistoryParserFactory.VersionDetector[]"
  28760. abstract="false" native="false" synchronized="false"
  28761. static="true" final="false" visibility="public"
  28762. deprecated="not deprecated">
  28763. </method>
  28764. <method name="valueOf" return="org.apache.hadoop.tools.rumen.JobHistoryParserFactory.VersionDetector"
  28765. abstract="false" native="false" synchronized="false"
  28766. static="true" final="false" visibility="public"
  28767. deprecated="not deprecated">
  28768. <param name="name" type="java.lang.String"/>
  28769. </method>
  28770. </class>
  28771. <!-- end class org.apache.hadoop.tools.rumen.JobHistoryParserFactory.VersionDetector -->
  28772. <!-- start interface org.apache.hadoop.tools.rumen.JobStory -->
  28773. <interface name="JobStory" abstract="true"
  28774. static="false" final="false" visibility="public"
  28775. deprecated="not deprecated">
  28776. <method name="getJobConf" return="org.apache.hadoop.mapred.JobConf"
  28777. abstract="false" native="false" synchronized="false"
  28778. static="false" final="false" visibility="public"
  28779. deprecated="not deprecated">
  28780. <doc>
  28781. <![CDATA[Get the {@link JobConf} for the job.
  28782. @return the <code>JobConf</code> for the job]]>
  28783. </doc>
  28784. </method>
  28785. <method name="getName" return="java.lang.String"
  28786. abstract="false" native="false" synchronized="false"
  28787. static="false" final="false" visibility="public"
  28788. deprecated="not deprecated">
  28789. <doc>
  28790. <![CDATA[Get the job name.
  28791. @return the job name]]>
  28792. </doc>
  28793. </method>
  28794. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  28795. abstract="false" native="false" synchronized="false"
  28796. static="false" final="false" visibility="public"
  28797. deprecated="not deprecated">
  28798. <doc>
  28799. <![CDATA[Get the job ID
  28800. @return the job ID]]>
  28801. </doc>
  28802. </method>
  28803. <method name="getUser" return="java.lang.String"
  28804. abstract="false" native="false" synchronized="false"
  28805. static="false" final="false" visibility="public"
  28806. deprecated="not deprecated">
  28807. <doc>
  28808. <![CDATA[Get the user who ran the job.
  28809. @return the user who ran the job]]>
  28810. </doc>
  28811. </method>
  28812. <method name="getSubmissionTime" return="long"
  28813. abstract="false" native="false" synchronized="false"
  28814. static="false" final="false" visibility="public"
  28815. deprecated="not deprecated">
  28816. <doc>
  28817. <![CDATA[Get the job submission time.
  28818. @return the job submission time]]>
  28819. </doc>
  28820. </method>
  28821. <method name="getNumberMaps" return="int"
  28822. abstract="false" native="false" synchronized="false"
  28823. static="false" final="false" visibility="public"
  28824. deprecated="not deprecated">
  28825. <doc>
  28826. <![CDATA[Get the number of maps in the {@link JobStory}.
  28827. @return the number of maps in the <code>Job</code>]]>
  28828. </doc>
  28829. </method>
  28830. <method name="getNumberReduces" return="int"
  28831. abstract="false" native="false" synchronized="false"
  28832. static="false" final="false" visibility="public"
  28833. deprecated="not deprecated">
  28834. <doc>
  28835. <![CDATA[Get the number of reduces in the {@link JobStory}.
  28836. @return the number of reduces in the <code>Job</code>]]>
  28837. </doc>
  28838. </method>
  28839. <method name="getInputSplits" return="org.apache.hadoop.mapreduce.InputSplit[]"
  28840. abstract="false" native="false" synchronized="false"
  28841. static="false" final="false" visibility="public"
  28842. deprecated="not deprecated">
  28843. <doc>
  28844. <![CDATA[Get the input splits for the job.
  28845. @return the input splits for the job]]>
  28846. </doc>
  28847. </method>
  28848. <method name="getTaskInfo" return="org.apache.hadoop.tools.rumen.TaskInfo"
  28849. abstract="false" native="false" synchronized="false"
  28850. static="false" final="false" visibility="public"
  28851. deprecated="not deprecated">
  28852. <param name="taskType" type="org.apache.hadoop.mapreduce.TaskType"/>
  28853. <param name="taskNumber" type="int"/>
  28854. <doc>
  28855. <![CDATA[Get {@link TaskInfo} for a given task.
  28856. @param taskType {@link TaskType} of the task
  28857. @param taskNumber Partition number of the task
  28858. @return the <code>TaskInfo</code> for the given task]]>
  28859. </doc>
  28860. </method>
  28861. <method name="getTaskAttemptInfo" return="org.apache.hadoop.tools.rumen.TaskAttemptInfo"
  28862. abstract="false" native="false" synchronized="false"
  28863. static="false" final="false" visibility="public"
  28864. deprecated="not deprecated">
  28865. <param name="taskType" type="org.apache.hadoop.mapreduce.TaskType"/>
  28866. <param name="taskNumber" type="int"/>
  28867. <param name="taskAttemptNumber" type="int"/>
  28868. <doc>
  28869. <![CDATA[Get {@link TaskAttemptInfo} for a given task-attempt, without regard to
  28870. impact of locality (e.g. not needed to make scheduling decisions).
  28871. @param taskType {@link TaskType} of the task-attempt
  28872. @param taskNumber Partition number of the task-attempt
  28873. @param taskAttemptNumber Attempt number of the task
  28874. @return the <code>TaskAttemptInfo</code> for the given task-attempt]]>
  28875. </doc>
  28876. </method>
  28877. <method name="getMapTaskAttemptInfoAdjusted" return="org.apache.hadoop.tools.rumen.TaskAttemptInfo"
  28878. abstract="false" native="false" synchronized="false"
  28879. static="false" final="false" visibility="public"
  28880. deprecated="not deprecated">
  28881. <param name="taskNumber" type="int"/>
  28882. <param name="taskAttemptNumber" type="int"/>
  28883. <param name="locality" type="int"/>
  28884. <doc>
  28885. <![CDATA[Get {@link TaskAttemptInfo} for a given task-attempt, considering impact
  28886. of locality.
  28887. @param taskNumber Partition number of the task-attempt
  28888. @param taskAttemptNumber Attempt number of the task
  28889. @param locality Data locality of the task as scheduled in simulation
  28890. @return the <code>TaskAttemptInfo</code> for the given task-attempt]]>
  28891. </doc>
  28892. </method>
  28893. <method name="getOutcome" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  28894. abstract="false" native="false" synchronized="false"
  28895. static="false" final="false" visibility="public"
  28896. deprecated="not deprecated">
  28897. <doc>
  28898. <![CDATA[Get the outcome of the job execution.
  28899. @return The outcome of the job execution.]]>
  28900. </doc>
  28901. </method>
  28902. <method name="getQueueName" return="java.lang.String"
  28903. abstract="false" native="false" synchronized="false"
  28904. static="false" final="false" visibility="public"
  28905. deprecated="not deprecated">
  28906. <doc>
  28907. <![CDATA[Get the queue where the job is submitted.
  28908. @return the queue where the job is submitted.]]>
  28909. </doc>
  28910. </method>
  28911. <doc>
  28912. <![CDATA[{@link JobStory} represents the runtime information available for a
  28913. completed Map-Reduce job.]]>
  28914. </doc>
  28915. </interface>
  28916. <!-- end interface org.apache.hadoop.tools.rumen.JobStory -->
  28917. <!-- start interface org.apache.hadoop.tools.rumen.JobStoryProducer -->
  28918. <interface name="JobStoryProducer" abstract="true"
  28919. static="false" final="false" visibility="public"
  28920. deprecated="not deprecated">
  28921. <implements name="java.io.Closeable"/>
  28922. <method name="getNextJob" return="org.apache.hadoop.tools.rumen.JobStory"
  28923. abstract="false" native="false" synchronized="false"
  28924. static="false" final="false" visibility="public"
  28925. deprecated="not deprecated">
  28926. <exception name="IOException" type="java.io.IOException"/>
  28927. <doc>
  28928. <![CDATA[Get the next job.
  28929. @return The next job, or null if no more jobs are available.
  28930. @throws IOException]]>
  28931. </doc>
  28932. </method>
  28933. <doc>
  28934. <![CDATA[{@link JobStoryProducer} produces the sequence of {@link JobStory}'s.]]>
  28935. </doc>
  28936. </interface>
  28937. <!-- end interface org.apache.hadoop.tools.rumen.JobStoryProducer -->
  28938. <!-- start class org.apache.hadoop.tools.rumen.JobTraceReader -->
  28939. <class name="JobTraceReader" extends="org.apache.hadoop.tools.rumen.JsonObjectMapperParser"
  28940. abstract="false"
  28941. static="false" final="false" visibility="public"
  28942. deprecated="not deprecated">
  28943. <constructor name="JobTraceReader" type="org.apache.hadoop.fs.Path, org.apache.hadoop.conf.Configuration"
  28944. static="false" final="false" visibility="public"
  28945. deprecated="not deprecated">
  28946. <exception name="IOException" type="java.io.IOException"/>
  28947. <doc>
  28948. <![CDATA[Constructor.
  28949. @param path
  28950. Path to the JSON trace file, possibly compressed.
  28951. @param conf
  28952. @throws IOException]]>
  28953. </doc>
  28954. </constructor>
  28955. <constructor name="JobTraceReader" type="java.io.InputStream"
  28956. static="false" final="false" visibility="public"
  28957. deprecated="not deprecated">
  28958. <exception name="IOException" type="java.io.IOException"/>
  28959. <doc>
  28960. <![CDATA[Constructor.
  28961. @param input
  28962. The input stream for the JSON trace.]]>
  28963. </doc>
  28964. </constructor>
  28965. <doc>
  28966. <![CDATA[Reads JSON-encoded job traces and produces {@link LoggedJob} instances.]]>
  28967. </doc>
  28968. </class>
  28969. <!-- end class org.apache.hadoop.tools.rumen.JobTraceReader -->
  28970. <!-- start class org.apache.hadoop.tools.rumen.JsonObjectMapperWriter -->
  28971. <class name="JsonObjectMapperWriter" extends="java.lang.Object"
  28972. abstract="false"
  28973. static="false" final="false" visibility="public"
  28974. deprecated="not deprecated">
  28975. <implements name="java.io.Closeable"/>
  28976. <constructor name="JsonObjectMapperWriter" type="java.io.OutputStream, boolean"
  28977. static="false" final="false" visibility="public"
  28978. deprecated="not deprecated">
  28979. <exception name="IOException" type="java.io.IOException"/>
  28980. </constructor>
  28981. <method name="write"
  28982. abstract="false" native="false" synchronized="false"
  28983. static="false" final="false" visibility="public"
  28984. deprecated="not deprecated">
  28985. <param name="object" type="T"/>
  28986. <exception name="IOException" type="java.io.IOException"/>
  28987. </method>
  28988. <method name="close"
  28989. abstract="false" native="false" synchronized="false"
  28990. static="false" final="false" visibility="public"
  28991. deprecated="not deprecated">
  28992. <exception name="IOException" type="java.io.IOException"/>
  28993. </method>
  28994. <doc>
  28995. <![CDATA[Simple wrapper around {@link JsonGenerator} to write objects in JSON format.
  28996. @param <T> The type of the objects to be written.]]>
  28997. </doc>
  28998. </class>
  28999. <!-- end class org.apache.hadoop.tools.rumen.JsonObjectMapperWriter -->
  29000. <!-- start class org.apache.hadoop.tools.rumen.LoggedDiscreteCDF -->
  29001. <class name="LoggedDiscreteCDF" extends="java.lang.Object"
  29002. abstract="false"
  29003. static="false" final="false" visibility="public"
  29004. deprecated="not deprecated">
  29005. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29006. <constructor name="LoggedDiscreteCDF"
  29007. static="false" final="false" visibility="public"
  29008. deprecated="not deprecated">
  29009. </constructor>
  29010. <method name="getMinimum" return="long"
  29011. abstract="false" native="false" synchronized="false"
  29012. static="false" final="false" visibility="public"
  29013. deprecated="not deprecated">
  29014. </method>
  29015. <method name="getRankings" return="java.util.List"
  29016. abstract="false" native="false" synchronized="false"
  29017. static="false" final="false" visibility="public"
  29018. deprecated="not deprecated">
  29019. </method>
  29020. <method name="getMaximum" return="long"
  29021. abstract="false" native="false" synchronized="false"
  29022. static="false" final="false" visibility="public"
  29023. deprecated="not deprecated">
  29024. </method>
  29025. <method name="getNumberValues" return="long"
  29026. abstract="false" native="false" synchronized="false"
  29027. static="false" final="false" visibility="public"
  29028. deprecated="not deprecated">
  29029. </method>
  29030. <method name="deepCompare"
  29031. abstract="false" native="false" synchronized="false"
  29032. static="false" final="false" visibility="public"
  29033. deprecated="not deprecated">
  29034. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29035. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29036. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29037. </method>
  29038. <doc>
  29039. <![CDATA[A {@link LoggedDiscreteCDF} is a discrete approximation of a cumulative
  29040. distribution function, with this class set up to meet the requirements of the
  29041. Jackson JSON parser/generator.
  29042. All of the public methods are simply accessors for the instance variables we
  29043. want to write out in the JSON files.]]>
  29044. </doc>
  29045. </class>
  29046. <!-- end class org.apache.hadoop.tools.rumen.LoggedDiscreteCDF -->
  29047. <!-- start class org.apache.hadoop.tools.rumen.LoggedJob -->
  29048. <class name="LoggedJob" extends="java.lang.Object"
  29049. abstract="false"
  29050. static="false" final="false" visibility="public"
  29051. deprecated="not deprecated">
  29052. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29053. <method name="setUnknownAttribute"
  29054. abstract="false" native="false" synchronized="false"
  29055. static="false" final="false" visibility="public"
  29056. deprecated="not deprecated">
  29057. <param name="attributeName" type="java.lang.String"/>
  29058. <param name="ignored" type="java.lang.Object"/>
  29059. </method>
  29060. <method name="getUser" return="java.lang.String"
  29061. abstract="false" native="false" synchronized="false"
  29062. static="false" final="false" visibility="public"
  29063. deprecated="not deprecated">
  29064. </method>
  29065. <method name="getJobID" return="java.lang.String"
  29066. abstract="false" native="false" synchronized="false"
  29067. static="false" final="false" visibility="public"
  29068. deprecated="not deprecated">
  29069. </method>
  29070. <method name="getPriority" return="org.apache.hadoop.tools.rumen.LoggedJob.JobPriority"
  29071. abstract="false" native="false" synchronized="false"
  29072. static="false" final="false" visibility="public"
  29073. deprecated="not deprecated">
  29074. </method>
  29075. <method name="getComputonsPerMapInputByte" return="long"
  29076. abstract="false" native="false" synchronized="false"
  29077. static="false" final="false" visibility="public"
  29078. deprecated="not deprecated">
  29079. </method>
  29080. <method name="getComputonsPerMapOutputByte" return="long"
  29081. abstract="false" native="false" synchronized="false"
  29082. static="false" final="false" visibility="public"
  29083. deprecated="not deprecated">
  29084. </method>
  29085. <method name="getComputonsPerReduceInputByte" return="long"
  29086. abstract="false" native="false" synchronized="false"
  29087. static="false" final="false" visibility="public"
  29088. deprecated="not deprecated">
  29089. </method>
  29090. <method name="getComputonsPerReduceOutputByte" return="long"
  29091. abstract="false" native="false" synchronized="false"
  29092. static="false" final="false" visibility="public"
  29093. deprecated="not deprecated">
  29094. </method>
  29095. <method name="getSubmitTime" return="long"
  29096. abstract="false" native="false" synchronized="false"
  29097. static="false" final="false" visibility="public"
  29098. deprecated="not deprecated">
  29099. </method>
  29100. <method name="getLaunchTime" return="long"
  29101. abstract="false" native="false" synchronized="false"
  29102. static="false" final="false" visibility="public"
  29103. deprecated="not deprecated">
  29104. </method>
  29105. <method name="getFinishTime" return="long"
  29106. abstract="false" native="false" synchronized="false"
  29107. static="false" final="false" visibility="public"
  29108. deprecated="not deprecated">
  29109. </method>
  29110. <method name="getHeapMegabytes" return="int"
  29111. abstract="false" native="false" synchronized="false"
  29112. static="false" final="false" visibility="public"
  29113. deprecated="not deprecated">
  29114. </method>
  29115. <method name="getTotalMaps" return="int"
  29116. abstract="false" native="false" synchronized="false"
  29117. static="false" final="false" visibility="public"
  29118. deprecated="not deprecated">
  29119. </method>
  29120. <method name="getTotalReduces" return="int"
  29121. abstract="false" native="false" synchronized="false"
  29122. static="false" final="false" visibility="public"
  29123. deprecated="not deprecated">
  29124. </method>
  29125. <method name="getOutcome" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  29126. abstract="false" native="false" synchronized="false"
  29127. static="false" final="false" visibility="public"
  29128. deprecated="not deprecated">
  29129. </method>
  29130. <method name="getJobtype" return="org.apache.hadoop.tools.rumen.LoggedJob.JobType"
  29131. abstract="false" native="false" synchronized="false"
  29132. static="false" final="false" visibility="public"
  29133. deprecated="not deprecated">
  29134. </method>
  29135. <method name="getDirectDependantJobs" return="java.util.List"
  29136. abstract="false" native="false" synchronized="false"
  29137. static="false" final="false" visibility="public"
  29138. deprecated="not deprecated">
  29139. </method>
  29140. <method name="getMapTasks" return="java.util.List"
  29141. abstract="false" native="false" synchronized="false"
  29142. static="false" final="false" visibility="public"
  29143. deprecated="not deprecated">
  29144. </method>
  29145. <method name="getReduceTasks" return="java.util.List"
  29146. abstract="false" native="false" synchronized="false"
  29147. static="false" final="false" visibility="public"
  29148. deprecated="not deprecated">
  29149. </method>
  29150. <method name="getOtherTasks" return="java.util.List"
  29151. abstract="false" native="false" synchronized="false"
  29152. static="false" final="false" visibility="public"
  29153. deprecated="not deprecated">
  29154. </method>
  29155. <method name="getSuccessfulMapAttemptCDFs" return="java.util.ArrayList"
  29156. abstract="false" native="false" synchronized="false"
  29157. static="false" final="false" visibility="public"
  29158. deprecated="not deprecated">
  29159. </method>
  29160. <method name="getFailedMapAttemptCDFs" return="java.util.ArrayList"
  29161. abstract="false" native="false" synchronized="false"
  29162. static="false" final="false" visibility="public"
  29163. deprecated="not deprecated">
  29164. </method>
  29165. <method name="getSuccessfulReduceAttemptCDF" return="org.apache.hadoop.tools.rumen.LoggedDiscreteCDF"
  29166. abstract="false" native="false" synchronized="false"
  29167. static="false" final="false" visibility="public"
  29168. deprecated="not deprecated">
  29169. </method>
  29170. <method name="getFailedReduceAttemptCDF" return="org.apache.hadoop.tools.rumen.LoggedDiscreteCDF"
  29171. abstract="false" native="false" synchronized="false"
  29172. static="false" final="false" visibility="public"
  29173. deprecated="not deprecated">
  29174. </method>
  29175. <method name="getMapperTriesToSucceed" return="double[]"
  29176. abstract="false" native="false" synchronized="false"
  29177. static="false" final="false" visibility="public"
  29178. deprecated="not deprecated">
  29179. </method>
  29180. <method name="getFailedMapperFraction" return="double"
  29181. abstract="false" native="false" synchronized="false"
  29182. static="false" final="false" visibility="public"
  29183. deprecated="not deprecated">
  29184. </method>
  29185. <method name="getRelativeTime" return="long"
  29186. abstract="false" native="false" synchronized="false"
  29187. static="false" final="false" visibility="public"
  29188. deprecated="not deprecated">
  29189. </method>
  29190. <method name="getQueue" return="java.lang.String"
  29191. abstract="false" native="false" synchronized="false"
  29192. static="false" final="false" visibility="public"
  29193. deprecated="not deprecated">
  29194. </method>
  29195. <method name="getJobName" return="java.lang.String"
  29196. abstract="false" native="false" synchronized="false"
  29197. static="false" final="false" visibility="public"
  29198. deprecated="not deprecated">
  29199. </method>
  29200. <method name="getClusterMapMB" return="int"
  29201. abstract="false" native="false" synchronized="false"
  29202. static="false" final="false" visibility="public"
  29203. deprecated="not deprecated">
  29204. </method>
  29205. <method name="getClusterReduceMB" return="int"
  29206. abstract="false" native="false" synchronized="false"
  29207. static="false" final="false" visibility="public"
  29208. deprecated="not deprecated">
  29209. </method>
  29210. <method name="getJobMapMB" return="int"
  29211. abstract="false" native="false" synchronized="false"
  29212. static="false" final="false" visibility="public"
  29213. deprecated="not deprecated">
  29214. </method>
  29215. <method name="getJobReduceMB" return="int"
  29216. abstract="false" native="false" synchronized="false"
  29217. static="false" final="false" visibility="public"
  29218. deprecated="not deprecated">
  29219. </method>
  29220. <method name="deepCompare"
  29221. abstract="false" native="false" synchronized="false"
  29222. static="false" final="false" visibility="public"
  29223. deprecated="not deprecated">
  29224. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29225. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29226. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29227. </method>
  29228. <doc>
  29229. <![CDATA[A {@link LoggedJob} is a representation of a hadoop job, with the
  29230. details of this class set up to meet the requirements of the Jackson JSON
  29231. parser/generator.
  29232. All of the public methods are simply accessors for the instance variables we
  29233. want to write out in the JSON files.]]>
  29234. </doc>
  29235. </class>
  29236. <!-- end class org.apache.hadoop.tools.rumen.LoggedJob -->
  29237. <!-- start class org.apache.hadoop.tools.rumen.LoggedJob.JobPriority -->
  29238. <class name="LoggedJob.JobPriority" extends="java.lang.Enum"
  29239. abstract="false"
  29240. static="true" final="true" visibility="public"
  29241. deprecated="not deprecated">
  29242. <method name="values" return="org.apache.hadoop.tools.rumen.LoggedJob.JobPriority[]"
  29243. abstract="false" native="false" synchronized="false"
  29244. static="true" final="false" visibility="public"
  29245. deprecated="not deprecated">
  29246. </method>
  29247. <method name="valueOf" return="org.apache.hadoop.tools.rumen.LoggedJob.JobPriority"
  29248. abstract="false" native="false" synchronized="false"
  29249. static="true" final="false" visibility="public"
  29250. deprecated="not deprecated">
  29251. <param name="name" type="java.lang.String"/>
  29252. </method>
  29253. </class>
  29254. <!-- end class org.apache.hadoop.tools.rumen.LoggedJob.JobPriority -->
  29255. <!-- start class org.apache.hadoop.tools.rumen.LoggedJob.JobType -->
  29256. <class name="LoggedJob.JobType" extends="java.lang.Enum"
  29257. abstract="false"
  29258. static="true" final="true" visibility="public"
  29259. deprecated="not deprecated">
  29260. <method name="values" return="org.apache.hadoop.tools.rumen.LoggedJob.JobType[]"
  29261. abstract="false" native="false" synchronized="false"
  29262. static="true" final="false" visibility="public"
  29263. deprecated="not deprecated">
  29264. </method>
  29265. <method name="valueOf" return="org.apache.hadoop.tools.rumen.LoggedJob.JobType"
  29266. abstract="false" native="false" synchronized="false"
  29267. static="true" final="false" visibility="public"
  29268. deprecated="not deprecated">
  29269. <param name="name" type="java.lang.String"/>
  29270. </method>
  29271. </class>
  29272. <!-- end class org.apache.hadoop.tools.rumen.LoggedJob.JobType -->
  29273. <!-- start class org.apache.hadoop.tools.rumen.LoggedLocation -->
  29274. <class name="LoggedLocation" extends="java.lang.Object"
  29275. abstract="false"
  29276. static="false" final="false" visibility="public"
  29277. deprecated="not deprecated">
  29278. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29279. <constructor name="LoggedLocation"
  29280. static="false" final="false" visibility="public"
  29281. deprecated="not deprecated">
  29282. </constructor>
  29283. <method name="getLayers" return="java.util.List"
  29284. abstract="false" native="false" synchronized="false"
  29285. static="false" final="false" visibility="public"
  29286. deprecated="not deprecated">
  29287. </method>
  29288. <method name="setUnknownAttribute"
  29289. abstract="false" native="false" synchronized="false"
  29290. static="false" final="false" visibility="public"
  29291. deprecated="not deprecated">
  29292. <param name="attributeName" type="java.lang.String"/>
  29293. <param name="ignored" type="java.lang.Object"/>
  29294. </method>
  29295. <method name="deepCompare"
  29296. abstract="false" native="false" synchronized="false"
  29297. static="false" final="false" visibility="public"
  29298. deprecated="not deprecated">
  29299. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29300. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29301. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29302. </method>
  29303. <doc>
  29304. <![CDATA[A {@link LoggedLocation} is a representation of a point in a hierarchical
  29305. network, represented as a series of membership names, broadest first.
  29306. For example, if your network has <i>hosts</i> grouped into <i>racks</i>, then
  29307. in one cluster you might have a node {@code node1} on rack {@code rack1}. This
  29308. would be represented with an ArrayList of two layers, with two {@link String}s
  29309. being {@code "rack1"} and {@code "node1"}.
  29310. The details of this class are set up to meet the requirements of the Jackson
  29311. JSON parser/generator.
  29312. All of the public methods are simply accessors for the instance variables we
  29313. want to write out in the JSON files.]]>
  29314. </doc>
  29315. </class>
  29316. <!-- end class org.apache.hadoop.tools.rumen.LoggedLocation -->
  29317. <!-- start class org.apache.hadoop.tools.rumen.LoggedNetworkTopology -->
  29318. <class name="LoggedNetworkTopology" extends="java.lang.Object"
  29319. abstract="false"
  29320. static="false" final="false" visibility="public"
  29321. deprecated="not deprecated">
  29322. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29323. <constructor name="LoggedNetworkTopology"
  29324. static="false" final="false" visibility="public"
  29325. deprecated="not deprecated">
  29326. </constructor>
  29327. <method name="setUnknownAttribute"
  29328. abstract="false" native="false" synchronized="false"
  29329. static="false" final="false" visibility="public"
  29330. deprecated="not deprecated">
  29331. <param name="attributeName" type="java.lang.String"/>
  29332. <param name="ignored" type="java.lang.Object"/>
  29333. </method>
  29334. <method name="getName" return="java.lang.String"
  29335. abstract="false" native="false" synchronized="false"
  29336. static="false" final="false" visibility="public"
  29337. deprecated="not deprecated">
  29338. </method>
  29339. <method name="getChildren" return="java.util.List"
  29340. abstract="false" native="false" synchronized="false"
  29341. static="false" final="false" visibility="public"
  29342. deprecated="not deprecated">
  29343. </method>
  29344. <method name="deepCompare"
  29345. abstract="false" native="false" synchronized="false"
  29346. static="false" final="false" visibility="public"
  29347. deprecated="not deprecated">
  29348. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29349. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29350. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29351. </method>
  29352. <doc>
  29353. <![CDATA[A {@link LoggedNetworkTopology} represents a tree that in turn represents a
  29354. hierarchy of hosts. The current version requires the tree to have all leaves
  29355. at the same level.
  29356. All of the public methods are simply accessors for the instance variables we
  29357. want to write out in the JSON files.]]>
  29358. </doc>
  29359. </class>
  29360. <!-- end class org.apache.hadoop.tools.rumen.LoggedNetworkTopology -->
  29361. <!-- start class org.apache.hadoop.tools.rumen.LoggedSingleRelativeRanking -->
  29362. <class name="LoggedSingleRelativeRanking" extends="java.lang.Object"
  29363. abstract="false"
  29364. static="false" final="false" visibility="public"
  29365. deprecated="not deprecated">
  29366. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29367. <constructor name="LoggedSingleRelativeRanking"
  29368. static="false" final="false" visibility="public"
  29369. deprecated="not deprecated">
  29370. </constructor>
  29371. <method name="setUnknownAttribute"
  29372. abstract="false" native="false" synchronized="false"
  29373. static="false" final="false" visibility="public"
  29374. deprecated="not deprecated">
  29375. <param name="attributeName" type="java.lang.String"/>
  29376. <param name="ignored" type="java.lang.Object"/>
  29377. </method>
  29378. <method name="getRelativeRanking" return="double"
  29379. abstract="false" native="false" synchronized="false"
  29380. static="false" final="false" visibility="public"
  29381. deprecated="not deprecated">
  29382. </method>
  29383. <method name="getDatum" return="long"
  29384. abstract="false" native="false" synchronized="false"
  29385. static="false" final="false" visibility="public"
  29386. deprecated="not deprecated">
  29387. </method>
  29388. <method name="deepCompare"
  29389. abstract="false" native="false" synchronized="false"
  29390. static="false" final="false" visibility="public"
  29391. deprecated="not deprecated">
  29392. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29393. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29394. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29395. </method>
  29396. <doc>
  29397. <![CDATA[A {@link LoggedSingleRelativeRanking} represents an X-Y coordinate of a
  29398. single point in a discrete CDF.
  29399. All of the public methods are simply accessors for the instance variables we
  29400. want to write out in the JSON files.]]>
  29401. </doc>
  29402. </class>
  29403. <!-- end class org.apache.hadoop.tools.rumen.LoggedSingleRelativeRanking -->
  29404. <!-- start class org.apache.hadoop.tools.rumen.LoggedTask -->
  29405. <class name="LoggedTask" extends="java.lang.Object"
  29406. abstract="false"
  29407. static="false" final="false" visibility="public"
  29408. deprecated="not deprecated">
  29409. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29410. <method name="setUnknownAttribute"
  29411. abstract="false" native="false" synchronized="false"
  29412. static="false" final="false" visibility="public"
  29413. deprecated="not deprecated">
  29414. <param name="attributeName" type="java.lang.String"/>
  29415. <param name="ignored" type="java.lang.Object"/>
  29416. </method>
  29417. <method name="getInputBytes" return="long"
  29418. abstract="false" native="false" synchronized="false"
  29419. static="false" final="false" visibility="public"
  29420. deprecated="not deprecated">
  29421. </method>
  29422. <method name="getInputRecords" return="long"
  29423. abstract="false" native="false" synchronized="false"
  29424. static="false" final="false" visibility="public"
  29425. deprecated="not deprecated">
  29426. </method>
  29427. <method name="getOutputBytes" return="long"
  29428. abstract="false" native="false" synchronized="false"
  29429. static="false" final="false" visibility="public"
  29430. deprecated="not deprecated">
  29431. </method>
  29432. <method name="getOutputRecords" return="long"
  29433. abstract="false" native="false" synchronized="false"
  29434. static="false" final="false" visibility="public"
  29435. deprecated="not deprecated">
  29436. </method>
  29437. <method name="getTaskID" return="java.lang.String"
  29438. abstract="false" native="false" synchronized="false"
  29439. static="false" final="false" visibility="public"
  29440. deprecated="not deprecated">
  29441. </method>
  29442. <method name="getStartTime" return="long"
  29443. abstract="false" native="false" synchronized="false"
  29444. static="false" final="false" visibility="public"
  29445. deprecated="not deprecated">
  29446. </method>
  29447. <method name="getFinishTime" return="long"
  29448. abstract="false" native="false" synchronized="false"
  29449. static="false" final="false" visibility="public"
  29450. deprecated="not deprecated">
  29451. </method>
  29452. <method name="getAttempts" return="java.util.List"
  29453. abstract="false" native="false" synchronized="false"
  29454. static="false" final="false" visibility="public"
  29455. deprecated="not deprecated">
  29456. </method>
  29457. <method name="getPreferredLocations" return="java.util.List"
  29458. abstract="false" native="false" synchronized="false"
  29459. static="false" final="false" visibility="public"
  29460. deprecated="not deprecated">
  29461. </method>
  29462. <method name="getTaskStatus" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  29463. abstract="false" native="false" synchronized="false"
  29464. static="false" final="false" visibility="public"
  29465. deprecated="not deprecated">
  29466. </method>
  29467. <method name="getTaskType" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  29468. abstract="false" native="false" synchronized="false"
  29469. static="false" final="false" visibility="public"
  29470. deprecated="not deprecated">
  29471. </method>
  29472. <method name="incorporateCounters"
  29473. abstract="false" native="false" synchronized="false"
  29474. static="false" final="false" visibility="public"
  29475. deprecated="not deprecated">
  29476. <param name="counters" type="org.apache.hadoop.mapreduce.jobhistory.JhCounters"/>
  29477. </method>
  29478. <method name="deepCompare"
  29479. abstract="false" native="false" synchronized="false"
  29480. static="false" final="false" visibility="public"
  29481. deprecated="not deprecated">
  29482. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29483. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29484. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29485. </method>
  29486. <doc>
  29487. <![CDATA[A {@link LoggedTask} represents a [hadoop] task that is part of a hadoop job.
  29488. It knows about the [possibly empty] sequence of attempts, its I/O footprint,
  29489. and its runtime.
  29490. All of the public methods are simply accessors for the instance variables we
  29491. want to write out in the JSON files.]]>
  29492. </doc>
  29493. </class>
  29494. <!-- end class org.apache.hadoop.tools.rumen.LoggedTask -->
  29495. <!-- start class org.apache.hadoop.tools.rumen.LoggedTaskAttempt -->
  29496. <class name="LoggedTaskAttempt" extends="java.lang.Object"
  29497. abstract="false"
  29498. static="false" final="false" visibility="public"
  29499. deprecated="not deprecated">
  29500. <implements name="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29501. <method name="setUnknownAttribute"
  29502. abstract="false" native="false" synchronized="false"
  29503. static="false" final="false" visibility="public"
  29504. deprecated="not deprecated">
  29505. <param name="attributeName" type="java.lang.String"/>
  29506. <param name="ignored" type="java.lang.Object"/>
  29507. </method>
  29508. <method name="getShuffleFinished" return="long"
  29509. abstract="false" native="false" synchronized="false"
  29510. static="false" final="false" visibility="public"
  29511. deprecated="not deprecated">
  29512. </method>
  29513. <method name="getSortFinished" return="long"
  29514. abstract="false" native="false" synchronized="false"
  29515. static="false" final="false" visibility="public"
  29516. deprecated="not deprecated">
  29517. </method>
  29518. <method name="getAttemptID" return="java.lang.String"
  29519. abstract="false" native="false" synchronized="false"
  29520. static="false" final="false" visibility="public"
  29521. deprecated="not deprecated">
  29522. </method>
  29523. <method name="getResult" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  29524. abstract="false" native="false" synchronized="false"
  29525. static="false" final="false" visibility="public"
  29526. deprecated="not deprecated">
  29527. </method>
  29528. <method name="getStartTime" return="long"
  29529. abstract="false" native="false" synchronized="false"
  29530. static="false" final="false" visibility="public"
  29531. deprecated="not deprecated">
  29532. </method>
  29533. <method name="getFinishTime" return="long"
  29534. abstract="false" native="false" synchronized="false"
  29535. static="false" final="false" visibility="public"
  29536. deprecated="not deprecated">
  29537. </method>
  29538. <method name="getHostName" return="java.lang.String"
  29539. abstract="false" native="false" synchronized="false"
  29540. static="false" final="false" visibility="public"
  29541. deprecated="not deprecated">
  29542. </method>
  29543. <method name="getHdfsBytesRead" return="long"
  29544. abstract="false" native="false" synchronized="false"
  29545. static="false" final="false" visibility="public"
  29546. deprecated="not deprecated">
  29547. </method>
  29548. <method name="getHdfsBytesWritten" return="long"
  29549. abstract="false" native="false" synchronized="false"
  29550. static="false" final="false" visibility="public"
  29551. deprecated="not deprecated">
  29552. </method>
  29553. <method name="getFileBytesRead" return="long"
  29554. abstract="false" native="false" synchronized="false"
  29555. static="false" final="false" visibility="public"
  29556. deprecated="not deprecated">
  29557. </method>
  29558. <method name="getFileBytesWritten" return="long"
  29559. abstract="false" native="false" synchronized="false"
  29560. static="false" final="false" visibility="public"
  29561. deprecated="not deprecated">
  29562. </method>
  29563. <method name="getMapInputRecords" return="long"
  29564. abstract="false" native="false" synchronized="false"
  29565. static="false" final="false" visibility="public"
  29566. deprecated="not deprecated">
  29567. </method>
  29568. <method name="getMapOutputBytes" return="long"
  29569. abstract="false" native="false" synchronized="false"
  29570. static="false" final="false" visibility="public"
  29571. deprecated="not deprecated">
  29572. </method>
  29573. <method name="getMapOutputRecords" return="long"
  29574. abstract="false" native="false" synchronized="false"
  29575. static="false" final="false" visibility="public"
  29576. deprecated="not deprecated">
  29577. </method>
  29578. <method name="getCombineInputRecords" return="long"
  29579. abstract="false" native="false" synchronized="false"
  29580. static="false" final="false" visibility="public"
  29581. deprecated="not deprecated">
  29582. </method>
  29583. <method name="getReduceInputGroups" return="long"
  29584. abstract="false" native="false" synchronized="false"
  29585. static="false" final="false" visibility="public"
  29586. deprecated="not deprecated">
  29587. </method>
  29588. <method name="getReduceInputRecords" return="long"
  29589. abstract="false" native="false" synchronized="false"
  29590. static="false" final="false" visibility="public"
  29591. deprecated="not deprecated">
  29592. </method>
  29593. <method name="getReduceShuffleBytes" return="long"
  29594. abstract="false" native="false" synchronized="false"
  29595. static="false" final="false" visibility="public"
  29596. deprecated="not deprecated">
  29597. </method>
  29598. <method name="getReduceOutputRecords" return="long"
  29599. abstract="false" native="false" synchronized="false"
  29600. static="false" final="false" visibility="public"
  29601. deprecated="not deprecated">
  29602. </method>
  29603. <method name="getSpilledRecords" return="long"
  29604. abstract="false" native="false" synchronized="false"
  29605. static="false" final="false" visibility="public"
  29606. deprecated="not deprecated">
  29607. </method>
  29608. <method name="getLocation" return="org.apache.hadoop.tools.rumen.LoggedLocation"
  29609. abstract="false" native="false" synchronized="false"
  29610. static="false" final="false" visibility="public"
  29611. deprecated="not deprecated">
  29612. </method>
  29613. <method name="getMapInputBytes" return="long"
  29614. abstract="false" native="false" synchronized="false"
  29615. static="false" final="false" visibility="public"
  29616. deprecated="not deprecated">
  29617. </method>
  29618. <method name="incorporateCounters"
  29619. abstract="false" native="false" synchronized="false"
  29620. static="false" final="false" visibility="public"
  29621. deprecated="not deprecated">
  29622. <param name="counters" type="org.apache.hadoop.mapreduce.jobhistory.JhCounters"/>
  29623. </method>
  29624. <method name="deepCompare"
  29625. abstract="false" native="false" synchronized="false"
  29626. static="false" final="false" visibility="public"
  29627. deprecated="not deprecated">
  29628. <param name="comparand" type="org.apache.hadoop.tools.rumen.DeepCompare"/>
  29629. <param name="loc" type="org.apache.hadoop.tools.rumen.TreePath"/>
  29630. <exception name="DeepInequalityException" type="org.apache.hadoop.tools.rumen.DeepInequalityException"/>
  29631. </method>
  29632. <doc>
  29633. <![CDATA[A {@link LoggedTaskAttempt} represents an attempt to run a hadoop task in a
  29634. hadoop job. Note that a task can have several attempts.
  29635. All of the public methods are simply accessors for the instance variables we
  29636. want to write out in the JSON files.]]>
  29637. </doc>
  29638. </class>
  29639. <!-- end class org.apache.hadoop.tools.rumen.LoggedTaskAttempt -->
  29640. <!-- start class org.apache.hadoop.tools.rumen.MachineNode -->
  29641. <class name="MachineNode" extends="org.apache.hadoop.tools.rumen.Node"
  29642. abstract="false"
  29643. static="false" final="true" visibility="public"
  29644. deprecated="not deprecated">
  29645. <method name="equals" return="boolean"
  29646. abstract="false" native="false" synchronized="false"
  29647. static="false" final="false" visibility="public"
  29648. deprecated="not deprecated">
  29649. <param name="obj" type="java.lang.Object"/>
  29650. </method>
  29651. <method name="hashCode" return="int"
  29652. abstract="false" native="false" synchronized="false"
  29653. static="false" final="false" visibility="public"
  29654. deprecated="not deprecated">
  29655. </method>
  29656. <method name="getMemory" return="long"
  29657. abstract="false" native="false" synchronized="false"
  29658. static="false" final="false" visibility="public"
  29659. deprecated="not deprecated">
  29660. <doc>
  29661. <![CDATA[Get the available physical RAM of the node.
  29662. @return The available physical RAM of the node, in KB.]]>
  29663. </doc>
  29664. </method>
  29665. <method name="getMapSlots" return="int"
  29666. abstract="false" native="false" synchronized="false"
  29667. static="false" final="false" visibility="public"
  29668. deprecated="not deprecated">
  29669. <doc>
  29670. <![CDATA[Get the number of map slots of the node.
  29671. @return The number of map slots of the node.]]>
  29672. </doc>
  29673. </method>
  29674. <method name="getReduceSlots" return="int"
  29675. abstract="false" native="false" synchronized="false"
  29676. static="false" final="false" visibility="public"
  29677. deprecated="not deprecated">
  29678. <doc>
  29679. <![CDATA[Get the number of reduce slots of the node.
  29680. @return The number of reduce slots of the node.]]>
  29681. </doc>
  29682. </method>
  29683. <method name="getMemoryPerMapSlot" return="long"
  29684. abstract="false" native="false" synchronized="false"
  29685. static="false" final="false" visibility="public"
  29686. deprecated="not deprecated">
  29687. <doc>
  29688. <![CDATA[Get the amount of RAM reserved for each map slot.
  29689. @return the amount of RAM reserved for each map slot, in KB.]]>
  29690. </doc>
  29691. </method>
  29692. <method name="getMemoryPerReduceSlot" return="long"
  29693. abstract="false" native="false" synchronized="false"
  29694. static="false" final="false" visibility="public"
  29695. deprecated="not deprecated">
  29696. <doc>
  29697. <![CDATA[Get the amount of RAM reserved for each reduce slot.
  29698. @return the amount of RAM reserved for each reduce slot, in KB.]]>
  29699. </doc>
  29700. </method>
  29701. <method name="getNumCores" return="int"
  29702. abstract="false" native="false" synchronized="false"
  29703. static="false" final="false" visibility="public"
  29704. deprecated="not deprecated">
  29705. <doc>
  29706. <![CDATA[Get the number of cores of the node.
  29707. @return the number of cores of the node.]]>
  29708. </doc>
  29709. </method>
  29710. <method name="getRackNode" return="org.apache.hadoop.tools.rumen.RackNode"
  29711. abstract="false" native="false" synchronized="false"
  29712. static="false" final="false" visibility="public"
  29713. deprecated="not deprecated">
  29714. <doc>
  29715. <![CDATA[Get the rack node that the machine belongs to.
  29716. @return The rack node that the machine belongs to. Returns null if the
  29717. machine does not belong to any rack.]]>
  29718. </doc>
  29719. </method>
  29720. <method name="addChild" return="boolean"
  29721. abstract="false" native="false" synchronized="true"
  29722. static="false" final="false" visibility="public"
  29723. deprecated="not deprecated">
  29724. <param name="child" type="org.apache.hadoop.tools.rumen.Node"/>
  29725. </method>
  29726. <doc>
  29727. <![CDATA[{@link MachineNode} represents the configuration of a cluster node.
  29728. {@link MachineNode} should be constructed by {@link MachineNode.Builder}.]]>
  29729. </doc>
  29730. </class>
  29731. <!-- end class org.apache.hadoop.tools.rumen.MachineNode -->
  29732. <!-- start class org.apache.hadoop.tools.rumen.MachineNode.Builder -->
  29733. <class name="MachineNode.Builder" extends="java.lang.Object"
  29734. abstract="false"
  29735. static="true" final="true" visibility="public"
  29736. deprecated="not deprecated">
  29737. <constructor name="MachineNode.Builder" type="java.lang.String, int"
  29738. static="false" final="false" visibility="public"
  29739. deprecated="not deprecated">
  29740. <doc>
  29741. <![CDATA[Start building a new {@link MachineNode} object.
  29742. @param name
  29743. Unique name of the node. Typically the fully qualified domain
  29744. name.]]>
  29745. </doc>
  29746. </constructor>
  29747. <method name="setMemory" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29748. abstract="false" native="false" synchronized="false"
  29749. static="false" final="false" visibility="public"
  29750. deprecated="not deprecated">
  29751. <param name="memory" type="long"/>
  29752. <doc>
  29753. <![CDATA[Set the physical memory of the node.
  29754. @param memory Available RAM in KB.]]>
  29755. </doc>
  29756. </method>
  29757. <method name="setMapSlots" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29758. abstract="false" native="false" synchronized="false"
  29759. static="false" final="false" visibility="public"
  29760. deprecated="not deprecated">
  29761. <param name="mapSlots" type="int"/>
  29762. <doc>
  29763. <![CDATA[Set the number of map slots for the node.
  29764. @param mapSlots The number of map slots for the node.]]>
  29765. </doc>
  29766. </method>
  29767. <method name="setReduceSlots" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29768. abstract="false" native="false" synchronized="false"
  29769. static="false" final="false" visibility="public"
  29770. deprecated="not deprecated">
  29771. <param name="reduceSlots" type="int"/>
  29772. <doc>
  29773. <![CDATA[Set the number of reduce slots for the node.
  29774. @param reduceSlots The number of reduce slots for the node.]]>
  29775. </doc>
  29776. </method>
  29777. <method name="setMemoryPerMapSlot" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29778. abstract="false" native="false" synchronized="false"
  29779. static="false" final="false" visibility="public"
  29780. deprecated="not deprecated">
  29781. <param name="memoryPerMapSlot" type="long"/>
  29782. <doc>
  29783. <![CDATA[Set the amount of RAM reserved for each map slot.
  29784. @param memoryPerMapSlot The amount of RAM reserved for each map slot, in KB.]]>
  29785. </doc>
  29786. </method>
  29787. <method name="setMemoryPerReduceSlot" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29788. abstract="false" native="false" synchronized="false"
  29789. static="false" final="false" visibility="public"
  29790. deprecated="not deprecated">
  29791. <param name="memoryPerReduceSlot" type="long"/>
  29792. <doc>
  29793. <![CDATA[Set the amount of RAM reserved for each reduce slot.
  29794. @param memoryPerReduceSlot The amount of RAM reserved for each reduce slot, in KB.]]>
  29795. </doc>
  29796. </method>
  29797. <method name="setNumCores" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29798. abstract="false" native="false" synchronized="false"
  29799. static="false" final="false" visibility="public"
  29800. deprecated="not deprecated">
  29801. <param name="numCores" type="int"/>
  29802. <doc>
  29803. <![CDATA[Set the number of cores for the node.
  29804. @param numCores Number of cores for the node.]]>
  29805. </doc>
  29806. </method>
  29807. <method name="cloneFrom" return="org.apache.hadoop.tools.rumen.MachineNode.Builder"
  29808. abstract="false" native="false" synchronized="false"
  29809. static="false" final="false" visibility="public"
  29810. deprecated="not deprecated">
  29811. <param name="ref" type="org.apache.hadoop.tools.rumen.MachineNode"/>
  29812. <doc>
  29813. <![CDATA[Clone the settings from a reference {@link MachineNode} object.
  29814. @param ref The reference {@link MachineNode} object.]]>
  29815. </doc>
  29816. </method>
  29817. <method name="build" return="org.apache.hadoop.tools.rumen.MachineNode"
  29818. abstract="false" native="false" synchronized="false"
  29819. static="false" final="false" visibility="public"
  29820. deprecated="not deprecated">
  29821. <doc>
  29822. <![CDATA[Build the {@link MachineNode} object.
  29823. @return The {@link MachineNode} object being built.]]>
  29824. </doc>
  29825. </method>
  29826. <doc>
  29827. <![CDATA[Builder for a {@link MachineNode} object]]>
  29828. </doc>
  29829. </class>
  29830. <!-- end class org.apache.hadoop.tools.rumen.MachineNode.Builder -->
  29831. <!-- start class org.apache.hadoop.tools.rumen.MapAttempt20LineHistoryEventEmitter -->
  29832. <class name="MapAttempt20LineHistoryEventEmitter" extends="org.apache.hadoop.tools.rumen.TaskAttempt20LineEventEmitter"
  29833. abstract="false"
  29834. static="false" final="false" visibility="public"
  29835. deprecated="not deprecated">
  29836. <constructor name="MapAttempt20LineHistoryEventEmitter"
  29837. static="false" final="false" visibility="protected"
  29838. deprecated="not deprecated">
  29839. </constructor>
  29840. </class>
  29841. <!-- end class org.apache.hadoop.tools.rumen.MapAttempt20LineHistoryEventEmitter -->
  29842. <!-- start class org.apache.hadoop.tools.rumen.MapTaskAttemptInfo -->
  29843. <class name="MapTaskAttemptInfo" extends="org.apache.hadoop.tools.rumen.TaskAttemptInfo"
  29844. abstract="false"
  29845. static="false" final="false" visibility="public"
  29846. deprecated="not deprecated">
  29847. <constructor name="MapTaskAttemptInfo" type="org.apache.hadoop.mapred.TaskStatus.State, org.apache.hadoop.tools.rumen.TaskInfo, long"
  29848. static="false" final="false" visibility="public"
  29849. deprecated="not deprecated">
  29850. </constructor>
  29851. <method name="getRuntime" return="long"
  29852. abstract="false" native="false" synchronized="false"
  29853. static="false" final="false" visibility="public"
  29854. deprecated="not deprecated">
  29855. </method>
  29856. <method name="getMapRuntime" return="long"
  29857. abstract="false" native="false" synchronized="false"
  29858. static="false" final="false" visibility="public"
  29859. deprecated="not deprecated">
  29860. <doc>
  29861. <![CDATA[Get the runtime for the <b>map</b> phase of the map-task attempt.
  29862. @return the runtime for the <b>map</b> phase of the map-task attempt]]>
  29863. </doc>
  29864. </method>
  29865. <doc>
  29866. <![CDATA[{@link MapTaskAttemptInfo} represents the information with regard to a
  29867. map task attempt.]]>
  29868. </doc>
  29869. </class>
  29870. <!-- end class org.apache.hadoop.tools.rumen.MapTaskAttemptInfo -->
  29871. <!-- start class org.apache.hadoop.tools.rumen.Node -->
  29872. <class name="Node" extends="java.lang.Object"
  29873. abstract="false"
  29874. static="false" final="false" visibility="public"
  29875. deprecated="not deprecated">
  29876. <implements name="java.lang.Comparable"/>
  29877. <constructor name="Node" type="java.lang.String, int"
  29878. static="false" final="false" visibility="public"
  29879. deprecated="not deprecated">
  29880. <doc>
  29881. <![CDATA[@param name
  29882. A unique name to identify a node in the cluster.
  29883. @param level
  29884. The level of the node in the cluster]]>
  29885. </doc>
  29886. </constructor>
  29887. <method name="getName" return="java.lang.String"
  29888. abstract="false" native="false" synchronized="false"
  29889. static="false" final="false" visibility="public"
  29890. deprecated="not deprecated">
  29891. <doc>
  29892. <![CDATA[Get the name of the node.
  29893. @return The name of the node.]]>
  29894. </doc>
  29895. </method>
  29896. <method name="getLevel" return="int"
  29897. abstract="false" native="false" synchronized="false"
  29898. static="false" final="false" visibility="public"
  29899. deprecated="not deprecated">
  29900. <doc>
  29901. <![CDATA[Get the level of the node.
  29902. @return The level of the node.]]>
  29903. </doc>
  29904. </method>
  29905. <method name="addChild" return="boolean"
  29906. abstract="false" native="false" synchronized="true"
  29907. static="false" final="false" visibility="public"
  29908. deprecated="not deprecated">
  29909. <param name="child" type="org.apache.hadoop.tools.rumen.Node"/>
  29910. <doc>
  29911. <![CDATA[Add a child node to this node.
  29912. @param child The child node to be added. The child node should not currently belong to another cluster topology.
  29913. @return Boolean indicating whether the node is successfully added.]]>
  29914. </doc>
  29915. </method>
  29916. <method name="hasChildren" return="boolean"
  29917. abstract="false" native="false" synchronized="true"
  29918. static="false" final="false" visibility="public"
  29919. deprecated="not deprecated">
  29920. <doc>
  29921. <![CDATA[Does this node have any children?
  29922. @return Boolean indicating whether this node has any children.]]>
  29923. </doc>
  29924. </method>
  29925. <method name="getChildren" return="java.util.Set"
  29926. abstract="false" native="false" synchronized="true"
  29927. static="false" final="false" visibility="public"
  29928. deprecated="not deprecated">
  29929. <doc>
  29930. <![CDATA[Get the children of this node.
  29931. @return The children of this node. If no child, an empty set will be
  29932. returned. The returned set is read-only.]]>
  29933. </doc>
  29934. </method>
  29935. <method name="getParent" return="org.apache.hadoop.tools.rumen.Node"
  29936. abstract="false" native="false" synchronized="false"
  29937. static="false" final="false" visibility="public"
  29938. deprecated="not deprecated">
  29939. <doc>
  29940. <![CDATA[Get the parent node.
  29941. @return the parent node. If root node, return null.]]>
  29942. </doc>
  29943. </method>
  29944. <method name="hashCode" return="int"
  29945. abstract="false" native="false" synchronized="false"
  29946. static="false" final="false" visibility="public"
  29947. deprecated="not deprecated">
  29948. </method>
  29949. <method name="equals" return="boolean"
  29950. abstract="false" native="false" synchronized="false"
  29951. static="false" final="false" visibility="public"
  29952. deprecated="not deprecated">
  29953. <param name="obj" type="java.lang.Object"/>
  29954. </method>
  29955. <method name="toString" return="java.lang.String"
  29956. abstract="false" native="false" synchronized="false"
  29957. static="false" final="false" visibility="public"
  29958. deprecated="not deprecated">
  29959. </method>
  29960. <method name="compareTo" return="int"
  29961. abstract="false" native="false" synchronized="false"
  29962. static="false" final="false" visibility="public"
  29963. deprecated="not deprecated">
  29964. <param name="o" type="org.apache.hadoop.tools.rumen.Node"/>
  29965. </method>
  29966. <doc>
  29967. <![CDATA[{@link Node} represents a node in the cluster topology. A node can be a
  29968. {@link MachineNode}, or a {@link RackNode}, etc.]]>
  29969. </doc>
  29970. </class>
  29971. <!-- end class org.apache.hadoop.tools.rumen.Node -->
  29972. <!-- start interface org.apache.hadoop.tools.rumen.Outputter -->
  29973. <interface name="Outputter" abstract="true"
  29974. static="false" final="false" visibility="public"
  29975. deprecated="not deprecated">
  29976. <implements name="java.io.Closeable"/>
  29977. <method name="init"
  29978. abstract="false" native="false" synchronized="false"
  29979. static="false" final="false" visibility="public"
  29980. deprecated="not deprecated">
  29981. <param name="path" type="org.apache.hadoop.fs.Path"/>
  29982. <param name="conf" type="org.apache.hadoop.conf.Configuration"/>
  29983. <exception name="IOException" type="java.io.IOException"/>
  29984. <doc>
  29985. <![CDATA[Initialize the {@link Outputter} to a specific path.
  29986. @param path The {@link Path} to the output file.
  29987. @param conf Configuration
  29988. @throws IOException]]>
  29989. </doc>
  29990. </method>
  29991. <method name="output"
  29992. abstract="false" native="false" synchronized="false"
  29993. static="false" final="false" visibility="public"
  29994. deprecated="not deprecated">
  29995. <param name="object" type="T"/>
  29996. <exception name="IOException" type="java.io.IOException"/>
  29997. <doc>
  29998. <![CDATA[Output an object.
  29999. @param object The object.
  30000. @throws IOException]]>
  30001. </doc>
  30002. </method>
  30003. <doc>
  30004. <![CDATA[Interface to output a sequence of objects of type T.]]>
  30005. </doc>
  30006. </interface>
  30007. <!-- end interface org.apache.hadoop.tools.rumen.Outputter -->
  30008. <!-- start class org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants -->
  30009. <class name="Pre21JobHistoryConstants" extends="java.lang.Object"
  30010. abstract="false"
  30011. static="false" final="false" visibility="public"
  30012. deprecated="not deprecated">
  30013. <constructor name="Pre21JobHistoryConstants"
  30014. static="false" final="false" visibility="public"
  30015. deprecated="not deprecated">
  30016. </constructor>
  30017. </class>
  30018. <!-- end class org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants -->
  30019. <!-- start class org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values -->
  30020. <class name="Pre21JobHistoryConstants.Values" extends="java.lang.Enum"
  30021. abstract="false"
  30022. static="true" final="true" visibility="public"
  30023. deprecated="not deprecated">
  30024. <method name="values" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values[]"
  30025. abstract="false" native="false" synchronized="false"
  30026. static="true" final="false" visibility="public"
  30027. deprecated="not deprecated">
  30028. </method>
  30029. <method name="valueOf" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  30030. abstract="false" native="false" synchronized="false"
  30031. static="true" final="false" visibility="public"
  30032. deprecated="not deprecated">
  30033. <param name="name" type="java.lang.String"/>
  30034. </method>
  30035. <doc>
  30036. <![CDATA[This enum contains some of the values commonly used by history log events.
  30037. Since values in history can only be strings, Values.name() is used in
  30038. most places in the history file.]]>
  30039. </doc>
  30040. </class>
  30041. <!-- end class org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values -->
  30042. <!-- start class org.apache.hadoop.tools.rumen.RackNode -->
  30043. <class name="RackNode" extends="org.apache.hadoop.tools.rumen.Node"
  30044. abstract="false"
  30045. static="false" final="true" visibility="public"
  30046. deprecated="not deprecated">
  30047. <constructor name="RackNode" type="java.lang.String, int"
  30048. static="false" final="false" visibility="public"
  30049. deprecated="not deprecated">
  30050. </constructor>
  30051. <method name="addChild" return="boolean"
  30052. abstract="false" native="false" synchronized="true"
  30053. static="false" final="false" visibility="public"
  30054. deprecated="not deprecated">
  30055. <param name="child" type="org.apache.hadoop.tools.rumen.Node"/>
  30056. </method>
  30057. <method name="getMachinesInRack" return="java.util.Set"
  30058. abstract="false" native="false" synchronized="false"
  30059. static="false" final="false" visibility="public"
  30060. deprecated="not deprecated">
  30061. <doc>
  30062. <![CDATA[Get the machine nodes that belong to the rack.
  30063. @return The machine nodes that belong to the rack.]]>
  30064. </doc>
  30065. </method>
  30066. <doc>
  30067. <![CDATA[{@link RackNode} represents a rack node in the cluster topology.]]>
  30068. </doc>
  30069. </class>
  30070. <!-- end class org.apache.hadoop.tools.rumen.RackNode -->
  30071. <!-- start class org.apache.hadoop.tools.rumen.RandomSeedGenerator -->
  30072. <class name="RandomSeedGenerator" extends="java.lang.Object"
  30073. abstract="false"
  30074. static="false" final="false" visibility="public"
  30075. deprecated="not deprecated">
  30076. <constructor name="RandomSeedGenerator"
  30077. static="false" final="false" visibility="public"
  30078. deprecated="not deprecated">
  30079. </constructor>
  30080. <method name="getSeed" return="long"
  30081. abstract="false" native="false" synchronized="false"
  30082. static="true" final="false" visibility="public"
  30083. deprecated="not deprecated">
  30084. <param name="streamId" type="java.lang.String"/>
  30085. <param name="masterSeed" type="long"/>
  30086. <doc>
  30087. <![CDATA[Generates a new random seed.
  30088. @param streamId a string identifying the stream of random numbers
  30089. @param masterSeed higher level master random seed
  30090. @return the random seed. Different (streamId, masterSeed) pairs result in
  30091. (vastly) different random seeds.]]>
  30092. </doc>
  30093. </method>
  30094. <doc>
  30095. <![CDATA[The purpose of this class is to generate new random seeds from a master
  30096. seed. This is needed to make the Random().next*() calls in rumen and mumak
  30097. deterministic so that mumak simulations become deterministically replayable.
  30098. In these tools we need many independent streams of random numbers, some of
  30099. which are created dynamically. We seed these streams with the sub-seeds
  30100. returned by RandomSeedGenerator.
  30101. For a slightly more complicated approach to generating multiple streams of
  30102. random numbers with better theoretical guarantees, see
  30103. P. L'Ecuyer, R. Simard, E. J. Chen, and W. D. Kelton,
  30104. ``An Object-Oriented Random-Number Package with Many Long Streams and
  30105. Substreams'', Operations Research, 50, 6 (2002), 1073--1075
  30106. http://www.iro.umontreal.ca/~lecuyer/papers.html
  30107. http://www.iro.umontreal.ca/~lecuyer/myftp/streams00/]]>
  30108. </doc>
  30109. </class>
  30110. <!-- end class org.apache.hadoop.tools.rumen.RandomSeedGenerator -->
  30111. <!-- start class org.apache.hadoop.tools.rumen.ReduceAttempt20LineHistoryEventEmitter -->
  30112. <class name="ReduceAttempt20LineHistoryEventEmitter" extends="org.apache.hadoop.tools.rumen.TaskAttempt20LineEventEmitter"
  30113. abstract="false"
  30114. static="false" final="false" visibility="public"
  30115. deprecated="not deprecated">
  30116. </class>
  30117. <!-- end class org.apache.hadoop.tools.rumen.ReduceAttempt20LineHistoryEventEmitter -->
  30118. <!-- start class org.apache.hadoop.tools.rumen.ReduceTaskAttemptInfo -->
  30119. <class name="ReduceTaskAttemptInfo" extends="org.apache.hadoop.tools.rumen.TaskAttemptInfo"
  30120. abstract="false"
  30121. static="false" final="false" visibility="public"
  30122. deprecated="not deprecated">
  30123. <constructor name="ReduceTaskAttemptInfo" type="org.apache.hadoop.mapred.TaskStatus.State, org.apache.hadoop.tools.rumen.TaskInfo, long, long, long"
  30124. static="false" final="false" visibility="public"
  30125. deprecated="not deprecated">
  30126. </constructor>
  30127. <method name="getReduceRuntime" return="long"
  30128. abstract="false" native="false" synchronized="false"
  30129. static="false" final="false" visibility="public"
  30130. deprecated="not deprecated">
  30131. <doc>
  30132. <![CDATA[Get the runtime for the <b>reduce</b> phase of the reduce task-attempt.
  30133. @return the runtime for the <b>reduce</b> phase of the reduce task-attempt]]>
  30134. </doc>
  30135. </method>
  30136. <method name="getShuffleRuntime" return="long"
  30137. abstract="false" native="false" synchronized="false"
  30138. static="false" final="false" visibility="public"
  30139. deprecated="not deprecated">
  30140. <doc>
  30141. <![CDATA[Get the runtime for the <b>shuffle</b> phase of the reduce task-attempt.
  30142. @return the runtime for the <b>shuffle</b> phase of the reduce task-attempt]]>
  30143. </doc>
  30144. </method>
  30145. <method name="getMergeRuntime" return="long"
  30146. abstract="false" native="false" synchronized="false"
  30147. static="false" final="false" visibility="public"
  30148. deprecated="not deprecated">
  30149. <doc>
  30150. <![CDATA[Get the runtime for the <b>merge</b> phase of the reduce task-attempt.
  30151. @return the runtime for the <b>merge</b> phase of the reduce task-attempt]]>
  30152. </doc>
  30153. </method>
  30154. <method name="getRuntime" return="long"
  30155. abstract="false" native="false" synchronized="false"
  30156. static="false" final="false" visibility="public"
  30157. deprecated="not deprecated">
  30158. </method>
  30159. <doc>
  30160. <![CDATA[{@link ReduceTaskAttemptInfo} represents the information with regard to a
  30161. reduce task attempt.]]>
  30162. </doc>
  30163. </class>
  30164. <!-- end class org.apache.hadoop.tools.rumen.ReduceTaskAttemptInfo -->
  30165. <!-- start class org.apache.hadoop.tools.rumen.RewindableInputStream -->
  30166. <class name="RewindableInputStream" extends="java.io.InputStream"
  30167. abstract="false"
  30168. static="false" final="false" visibility="public"
  30169. deprecated="not deprecated">
  30170. <constructor name="RewindableInputStream" type="java.io.InputStream"
  30171. static="false" final="false" visibility="public"
  30172. deprecated="not deprecated">
  30173. <doc>
  30174. <![CDATA[Constructor.
  30175. @param input]]>
  30176. </doc>
  30177. </constructor>
  30178. <constructor name="RewindableInputStream" type="java.io.InputStream, int"
  30179. static="false" final="false" visibility="public"
  30180. deprecated="not deprecated">
  30181. <doc>
  30182. <![CDATA[Constructor
  30183. @param input
  30184. input stream.
  30185. @param maxBytesToRemember
  30186. Maximum number of bytes we need to remember at the beginning of
  30187. the stream. If {@link #rewind()} is called after so many bytes are
  30188. read from the stream, {@link #rewind()} would fail.]]>
  30189. </doc>
  30190. </constructor>
  30191. <method name="read" return="int"
  30192. abstract="false" native="false" synchronized="false"
  30193. static="false" final="false" visibility="public"
  30194. deprecated="not deprecated">
  30195. <exception name="IOException" type="java.io.IOException"/>
  30196. </method>
  30197. <method name="read" return="int"
  30198. abstract="false" native="false" synchronized="false"
  30199. static="false" final="false" visibility="public"
  30200. deprecated="not deprecated">
  30201. <param name="buffer" type="byte[]"/>
  30202. <param name="offset" type="int"/>
  30203. <param name="length" type="int"/>
  30204. <exception name="IOException" type="java.io.IOException"/>
  30205. </method>
  30206. <method name="close"
  30207. abstract="false" native="false" synchronized="false"
  30208. static="false" final="false" visibility="public"
  30209. deprecated="not deprecated">
  30210. <exception name="IOException" type="java.io.IOException"/>
  30211. </method>
  30212. <method name="rewind" return="java.io.InputStream"
  30213. abstract="false" native="false" synchronized="false"
  30214. static="false" final="false" visibility="public"
  30215. deprecated="not deprecated">
  30216. <exception name="IOException" type="java.io.IOException"/>
  30217. </method>
  30218. <doc>
  30219. <![CDATA[A simple wrapper class to make any input stream "rewindable". It could be
  30220. made more memory efficient by growing the internal buffer adaptively.]]>
  30221. </doc>
  30222. </class>
  30223. <!-- end class org.apache.hadoop.tools.rumen.RewindableInputStream -->
  30224. <!-- start class org.apache.hadoop.tools.rumen.Task20LineHistoryEventEmitter -->
  30225. <class name="Task20LineHistoryEventEmitter" extends="org.apache.hadoop.tools.rumen.HistoryEventEmitter"
  30226. abstract="false"
  30227. static="false" final="false" visibility="public"
  30228. deprecated="not deprecated">
  30229. <constructor name="Task20LineHistoryEventEmitter"
  30230. static="false" final="false" visibility="protected"
  30231. deprecated="not deprecated">
  30232. </constructor>
  30233. </class>
  30234. <!-- end class org.apache.hadoop.tools.rumen.Task20LineHistoryEventEmitter -->
  30235. <!-- start class org.apache.hadoop.tools.rumen.TaskAttempt20LineEventEmitter -->
  30236. <class name="TaskAttempt20LineEventEmitter" extends="org.apache.hadoop.tools.rumen.HistoryEventEmitter"
  30237. abstract="true"
  30238. static="false" final="false" visibility="public"
  30239. deprecated="not deprecated">
  30240. <constructor name="TaskAttempt20LineEventEmitter"
  30241. static="false" final="false" visibility="protected"
  30242. deprecated="not deprecated">
  30243. </constructor>
  30244. </class>
  30245. <!-- end class org.apache.hadoop.tools.rumen.TaskAttempt20LineEventEmitter -->
  30246. <!-- start class org.apache.hadoop.tools.rumen.TaskAttemptInfo -->
  30247. <class name="TaskAttemptInfo" extends="java.lang.Object"
  30248. abstract="true"
  30249. static="false" final="false" visibility="public"
  30250. deprecated="not deprecated">
  30251. <constructor name="TaskAttemptInfo" type="org.apache.hadoop.mapred.TaskStatus.State, org.apache.hadoop.tools.rumen.TaskInfo"
  30252. static="false" final="false" visibility="protected"
  30253. deprecated="not deprecated">
  30254. </constructor>
  30255. <method name="getRunState" return="org.apache.hadoop.mapred.TaskStatus.State"
  30256. abstract="false" native="false" synchronized="false"
  30257. static="false" final="false" visibility="public"
  30258. deprecated="not deprecated">
  30259. <doc>
  30260. <![CDATA[Get the final {@link State} of the task-attempt.
  30261. @return the final <code>State</code> of the task-attempt]]>
  30262. </doc>
  30263. </method>
  30264. <method name="getRuntime" return="long"
  30265. abstract="true" native="false" synchronized="false"
  30266. static="false" final="false" visibility="public"
  30267. deprecated="not deprecated">
  30268. <doc>
  30269. <![CDATA[Get the total runtime for the task-attempt.
  30270. @return the total runtime for the task-attempt]]>
  30271. </doc>
  30272. </method>
  30273. <method name="getTaskInfo" return="org.apache.hadoop.tools.rumen.TaskInfo"
  30274. abstract="false" native="false" synchronized="false"
  30275. static="false" final="false" visibility="public"
  30276. deprecated="not deprecated">
  30277. <doc>
  30278. <![CDATA[Get the {@link TaskInfo} for the given task-attempt.
  30279. @return the <code>TaskInfo</code> for the given task-attempt]]>
  30280. </doc>
  30281. </method>
  30282. <field name="state" type="org.apache.hadoop.mapred.TaskStatus.State"
  30283. transient="false" volatile="false"
  30284. static="false" final="true" visibility="protected"
  30285. deprecated="not deprecated">
  30286. </field>
  30287. <field name="taskInfo" type="org.apache.hadoop.tools.rumen.TaskInfo"
  30288. transient="false" volatile="false"
  30289. static="false" final="true" visibility="protected"
  30290. deprecated="not deprecated">
  30291. </field>
  30292. <doc>
  30293. <![CDATA[{@link TaskAttemptInfo} is a collection of statistics about a particular
  30294. task-attempt gleaned from job-history of the job.]]>
  30295. </doc>
  30296. </class>
  30297. <!-- end class org.apache.hadoop.tools.rumen.TaskAttemptInfo -->
  30298. <!-- start class org.apache.hadoop.tools.rumen.TaskInfo -->
  30299. <class name="TaskInfo" extends="java.lang.Object"
  30300. abstract="false"
  30301. static="false" final="false" visibility="public"
  30302. deprecated="not deprecated">
  30303. <constructor name="TaskInfo" type="long, int, long, int, long"
  30304. static="false" final="false" visibility="public"
  30305. deprecated="not deprecated">
  30306. </constructor>
  30307. <method name="getInputBytes" return="long"
  30308. abstract="false" native="false" synchronized="false"
  30309. static="false" final="false" visibility="public"
  30310. deprecated="not deprecated">
  30311. <doc>
  30312. <![CDATA[@return Raw bytes read from the FileSystem into the task. Note that this
  30313. may not always match the input bytes to the task.]]>
  30314. </doc>
  30315. </method>
  30316. <method name="getInputRecords" return="int"
  30317. abstract="false" native="false" synchronized="false"
  30318. static="false" final="false" visibility="public"
  30319. deprecated="not deprecated">
  30320. <doc>
  30321. <![CDATA[@return Number of records input to this task.]]>
  30322. </doc>
  30323. </method>
  30324. <method name="getOutputBytes" return="long"
  30325. abstract="false" native="false" synchronized="false"
  30326. static="false" final="false" visibility="public"
  30327. deprecated="not deprecated">
  30328. <doc>
  30329. <![CDATA[@return Raw bytes written to the destination FileSystem. Note that this may
  30330. not match output bytes.]]>
  30331. </doc>
  30332. </method>
  30333. <method name="getOutputRecords" return="int"
  30334. abstract="false" native="false" synchronized="false"
  30335. static="false" final="false" visibility="public"
  30336. deprecated="not deprecated">
  30337. <doc>
  30338. <![CDATA[@return Number of records output from this task.]]>
  30339. </doc>
  30340. </method>
  30341. <method name="getTaskMemory" return="long"
  30342. abstract="false" native="false" synchronized="false"
  30343. static="false" final="false" visibility="public"
  30344. deprecated="not deprecated">
  30345. <doc>
  30346. <![CDATA[@return Memory used by the task, less than or equal to the heap size.]]>
  30347. </doc>
  30348. </method>
  30349. </class>
  30350. <!-- end class org.apache.hadoop.tools.rumen.TaskInfo -->
  30351. <!-- start class org.apache.hadoop.tools.rumen.TopologyBuilder -->
  30352. <class name="TopologyBuilder" extends="java.lang.Object"
  30353. abstract="false"
  30354. static="false" final="false" visibility="public"
  30355. deprecated="not deprecated">
  30356. <constructor name="TopologyBuilder"
  30357. static="false" final="false" visibility="public"
  30358. deprecated="not deprecated">
  30359. </constructor>
  30360. <method name="process"
  30361. abstract="false" native="false" synchronized="false"
  30362. static="false" final="false" visibility="public"
  30363. deprecated="not deprecated">
  30364. <param name="event" type="org.apache.hadoop.mapreduce.jobhistory.HistoryEvent"/>
  30365. <doc>
  30366. <![CDATA[Process one {@link HistoryEvent}
  30367. @param event
  30368. The {@link HistoryEvent} to be processed.]]>
  30369. </doc>
  30370. </method>
  30371. <method name="process"
  30372. abstract="false" native="false" synchronized="false"
  30373. static="false" final="false" visibility="public"
  30374. deprecated="not deprecated">
  30375. <param name="conf" type="java.util.Properties"/>
  30376. <doc>
  30377. <![CDATA[Process a collection of JobConf {@link Properties}. We do not restrict it
  30378. to be called once.
  30379. @param conf
  30380. The job conf properties to be added.]]>
  30381. </doc>
  30382. </method>
  30383. <method name="build" return="org.apache.hadoop.tools.rumen.LoggedNetworkTopology"
  30384. abstract="false" native="false" synchronized="false"
  30385. static="false" final="false" visibility="public"
  30386. deprecated="not deprecated">
  30387. <doc>
  30388. <![CDATA[Request the builder to build the final object. Once called, the
  30389. {@link TopologyBuilder} would accept no more events or job-conf properties.
  30390. @return Parsed {@link LoggedNetworkTopology} object.]]>
  30391. </doc>
  30392. </method>
  30393. <doc>
  30394. <![CDATA[Building the cluster topology.]]>
  30395. </doc>
  30396. </class>
  30397. <!-- end class org.apache.hadoop.tools.rumen.TopologyBuilder -->
  30398. <!-- start class org.apache.hadoop.tools.rumen.TraceBuilder -->
  30399. <class name="TraceBuilder" extends="org.apache.hadoop.conf.Configured"
  30400. abstract="false"
  30401. static="false" final="false" visibility="public"
  30402. deprecated="not deprecated">
  30403. <implements name="org.apache.hadoop.util.Tool"/>
  30404. <constructor name="TraceBuilder"
  30405. static="false" final="false" visibility="public"
  30406. deprecated="not deprecated">
  30407. </constructor>
  30408. <method name="main"
  30409. abstract="false" native="false" synchronized="false"
  30410. static="true" final="false" visibility="public"
  30411. deprecated="not deprecated">
  30412. <param name="args" type="java.lang.String[]"/>
  30413. </method>
  30414. <method name="run" return="int"
  30415. abstract="false" native="false" synchronized="false"
  30416. static="false" final="false" visibility="public"
  30417. deprecated="not deprecated">
  30418. <param name="args" type="java.lang.String[]"/>
  30419. <exception name="Exception" type="java.lang.Exception"/>
  30420. </method>
  30421. <doc>
  30422. <![CDATA[The main driver of the Rumen Parser.]]>
  30423. </doc>
  30424. </class>
  30425. <!-- end class org.apache.hadoop.tools.rumen.TraceBuilder -->
  30426. <!-- start class org.apache.hadoop.tools.rumen.TreePath -->
  30427. <class name="TreePath" extends="java.lang.Object"
  30428. abstract="false"
  30429. static="false" final="false" visibility="public"
  30430. deprecated="not deprecated">
  30431. <constructor name="TreePath" type="org.apache.hadoop.tools.rumen.TreePath, java.lang.String"
  30432. static="false" final="false" visibility="public"
  30433. deprecated="not deprecated">
  30434. </constructor>
  30435. <constructor name="TreePath" type="org.apache.hadoop.tools.rumen.TreePath, java.lang.String, int"
  30436. static="false" final="false" visibility="public"
  30437. deprecated="not deprecated">
  30438. </constructor>
  30439. <method name="toString" return="java.lang.String"
  30440. abstract="false" native="false" synchronized="false"
  30441. static="false" final="false" visibility="public"
  30442. deprecated="not deprecated">
  30443. </method>
  30444. <doc>
  30445. <![CDATA[This describes a path from a node to the root. We use it when we compare two
  30446. trees during rumen unit tests. If the trees are not identical, this chain
  30447. will be converted to a string which describes the path from the root to the
  30448. fields that did not compare.]]>
  30449. </doc>
  30450. </class>
  30451. <!-- end class org.apache.hadoop.tools.rumen.TreePath -->
  30452. <!-- start class org.apache.hadoop.tools.rumen.ZombieCluster -->
  30453. <class name="ZombieCluster" extends="org.apache.hadoop.tools.rumen.AbstractClusterStory"
  30454. abstract="false"
  30455. static="false" final="false" visibility="public"
  30456. deprecated="not deprecated">
  30457. <constructor name="ZombieCluster" type="org.apache.hadoop.tools.rumen.LoggedNetworkTopology, org.apache.hadoop.tools.rumen.MachineNode"
  30458. static="false" final="false" visibility="public"
  30459. deprecated="not deprecated">
  30460. <doc>
  30461. <![CDATA[Construct a homogeneous cluster. We assume that the leaves on the topology
  30462. are {@link MachineNode}s, and the parents of {@link MachineNode}s are
  30463. {@link RackNode}s. We also expect all leaf nodes are on the same level.
  30464. @param topology
  30465. The network topology.
  30466. @param defaultNode
  30467. The default node setting.]]>
  30468. </doc>
  30469. </constructor>
  30470. <constructor name="ZombieCluster" type="org.apache.hadoop.fs.Path, org.apache.hadoop.tools.rumen.MachineNode, org.apache.hadoop.conf.Configuration"
  30471. static="false" final="false" visibility="public"
  30472. deprecated="not deprecated">
  30473. <exception name="IOException" type="java.io.IOException"/>
  30474. <doc>
  30475. <![CDATA[Construct a homogeneous cluster. We assume that the leaves on the topology
  30476. are {@link MachineNode}s, and the parents of {@link MachineNode}s are
  30477. {@link RackNode}s. We also expect all leaf nodes are on the same level.
  30478. @param path Path to the JSON-encoded topology file.
  30479. @param conf
  30480. @param defaultNode
  30481. The default node setting.
  30482. @throws IOException]]>
  30483. </doc>
  30484. </constructor>
  30485. <constructor name="ZombieCluster" type="java.io.InputStream, org.apache.hadoop.tools.rumen.MachineNode"
  30486. static="false" final="false" visibility="public"
  30487. deprecated="not deprecated">
  30488. <exception name="IOException" type="java.io.IOException"/>
  30489. <doc>
  30490. <![CDATA[Construct a homogeneous cluster. We assume that the leaves on the topology
  30491. are {@link MachineNode}s, and the parents of {@link MachineNode}s are
  30492. {@link RackNode}s. We also expect all leaf nodes are on the same level.
  30493. @param input The input stream for the JSON-encoded topology file.
  30494. @param defaultNode
  30495. The default node setting.
  30496. @throws IOException]]>
  30497. </doc>
  30498. </constructor>
  30499. <method name="getClusterTopology" return="org.apache.hadoop.tools.rumen.Node"
  30500. abstract="false" native="false" synchronized="false"
  30501. static="false" final="false" visibility="public"
  30502. deprecated="not deprecated">
  30503. </method>
  30504. <doc>
  30505. <![CDATA[{@link ZombieCluster} rebuilds the cluster topology using the information
  30506. obtained from job history logs.]]>
  30507. </doc>
  30508. </class>
  30509. <!-- end class org.apache.hadoop.tools.rumen.ZombieCluster -->
  30510. <!-- start class org.apache.hadoop.tools.rumen.ZombieJob -->
  30511. <class name="ZombieJob" extends="java.lang.Object"
  30512. abstract="false"
  30513. static="false" final="false" visibility="public"
  30514. deprecated="not deprecated">
  30515. <implements name="org.apache.hadoop.tools.rumen.JobStory"/>
  30516. <constructor name="ZombieJob" type="org.apache.hadoop.tools.rumen.LoggedJob, org.apache.hadoop.tools.rumen.ClusterStory, long"
  30517. static="false" final="false" visibility="public"
  30518. deprecated="not deprecated">
  30519. <doc>
  30520. <![CDATA[This constructor creates a {@link ZombieJob} with the same semantics as the
  30521. {@link LoggedJob} passed in as a parameter.
  30522. @param job
  30523. The dead job this ZombieJob instance is based on.
  30524. @param cluster
  30525. The cluster topology where the dead job ran on. This argument can
  30526. be null if we do not have knowledge of the cluster topology.
  30527. @param seed
  30528. Seed for the random number generator for filling in information
  30529. not available from the ZombieJob.]]>
  30530. </doc>
  30531. </constructor>
  30532. <constructor name="ZombieJob" type="org.apache.hadoop.tools.rumen.LoggedJob, org.apache.hadoop.tools.rumen.ClusterStory"
  30533. static="false" final="false" visibility="public"
  30534. deprecated="not deprecated">
  30535. <doc>
  30536. <![CDATA[This constructor creates a {@link ZombieJob} with the same semantics as the
  30537. {@link LoggedJob} passed in as a parameter.
  30538. @param job
  30539. The dead job this ZombieJob instance is based on.
  30540. @param cluster
  30541. The cluster topology where the dead job ran on. This argument can
  30542. be null if we do not have knowledge of the cluster topology.]]>
  30543. </doc>
  30544. </constructor>
  30545. <method name="getJobConf" return="org.apache.hadoop.mapred.JobConf"
  30546. abstract="false" native="false" synchronized="true"
  30547. static="false" final="false" visibility="public"
  30548. deprecated="not deprecated">
  30549. </method>
  30550. <method name="getInputSplits" return="org.apache.hadoop.mapreduce.InputSplit[]"
  30551. abstract="false" native="false" synchronized="false"
  30552. static="false" final="false" visibility="public"
  30553. deprecated="not deprecated">
  30554. </method>
  30555. <method name="getName" return="java.lang.String"
  30556. abstract="false" native="false" synchronized="false"
  30557. static="false" final="false" visibility="public"
  30558. deprecated="not deprecated">
  30559. </method>
  30560. <method name="getJobID" return="org.apache.hadoop.mapreduce.JobID"
  30561. abstract="false" native="false" synchronized="false"
  30562. static="false" final="false" visibility="public"
  30563. deprecated="not deprecated">
  30564. </method>
  30565. <method name="getNumberMaps" return="int"
  30566. abstract="false" native="false" synchronized="false"
  30567. static="false" final="false" visibility="public"
  30568. deprecated="not deprecated">
  30569. </method>
  30570. <method name="getNumberReduces" return="int"
  30571. abstract="false" native="false" synchronized="false"
  30572. static="false" final="false" visibility="public"
  30573. deprecated="not deprecated">
  30574. </method>
  30575. <method name="getOutcome" return="org.apache.hadoop.tools.rumen.Pre21JobHistoryConstants.Values"
  30576. abstract="false" native="false" synchronized="false"
  30577. static="false" final="false" visibility="public"
  30578. deprecated="not deprecated">
  30579. </method>
  30580. <method name="getSubmissionTime" return="long"
  30581. abstract="false" native="false" synchronized="false"
  30582. static="false" final="false" visibility="public"
  30583. deprecated="not deprecated">
  30584. </method>
  30585. <method name="getQueueName" return="java.lang.String"
  30586. abstract="false" native="false" synchronized="false"
  30587. static="false" final="false" visibility="public"
  30588. deprecated="not deprecated">
  30589. </method>
  30590. <method name="getNumLoggedMaps" return="int"
  30591. abstract="false" native="false" synchronized="false"
  30592. static="false" final="false" visibility="public"
  30593. deprecated="not deprecated">
  30594. <doc>
  30595. <![CDATA[Getting the number of map tasks that are actually logged in the trace.
  30596. @return The number of map tasks that are actually logged in the trace.]]>
  30597. </doc>
  30598. </method>
  30599. <method name="getNumLoggedReduces" return="int"
  30600. abstract="false" native="false" synchronized="false"
  30601. static="false" final="false" visibility="public"
  30602. deprecated="not deprecated">
  30603. <doc>
  30604. <![CDATA[Getting the number of reduce tasks that are actually logged in the trace.
  30605. @return The number of reduce tasks that are actually logged in the trace.]]>
  30606. </doc>
  30607. </method>
  30608. <method name="getUser" return="java.lang.String"
  30609. abstract="false" native="false" synchronized="false"
  30610. static="false" final="false" visibility="public"
  30611. deprecated="not deprecated">
  30612. </method>
  30613. <method name="getLoggedJob" return="org.apache.hadoop.tools.rumen.LoggedJob"
  30614. abstract="false" native="false" synchronized="false"
  30615. static="false" final="false" visibility="public"
  30616. deprecated="not deprecated">
  30617. <doc>
  30618. <![CDATA[Get the underlying {@link LoggedJob} object read directly from the trace.
  30619. This is mainly for debugging.
  30620. @return the underlying {@link LoggedJob} object]]>
  30621. </doc>
  30622. </method>
  30623. <method name="getTaskAttemptInfo" return="org.apache.hadoop.tools.rumen.TaskAttemptInfo"
  30624. abstract="false" native="false" synchronized="false"
  30625. static="false" final="false" visibility="public"
  30626. deprecated="not deprecated">
  30627. <param name="taskType" type="org.apache.hadoop.mapreduce.TaskType"/>
  30628. <param name="taskNumber" type="int"/>
  30629. <param name="taskAttemptNumber" type="int"/>
  30630. <doc>
  30631. <![CDATA[Get a {@link TaskAttemptInfo} with a {@link TaskAttemptID} associated with
  30632. taskType, taskNumber, and taskAttemptNumber. This function does not care
  30633. about locality, and follows the following decision logic: 1. Make up a
  30634. {@link TaskAttemptInfo} if the task attempt is missing in trace, 2. Make up
  30635. a {@link TaskAttemptInfo} if the task attempt has a KILLED final status in
  30636. trace, 3. Otherwise (final state is SUCCEEDED or FAILED), construct the
  30637. {@link TaskAttemptInfo} from the trace.]]>
  30638. </doc>
  30639. </method>
  30640. <method name="getTaskInfo" return="org.apache.hadoop.tools.rumen.TaskInfo"
  30641. abstract="false" native="false" synchronized="false"
  30642. static="false" final="false" visibility="public"
  30643. deprecated="not deprecated">
  30644. <param name="taskType" type="org.apache.hadoop.mapreduce.TaskType"/>
  30645. <param name="taskNumber" type="int"/>
  30646. </method>
  30647. <method name="getMapTaskAttemptInfoAdjusted" return="org.apache.hadoop.tools.rumen.TaskAttemptInfo"
  30648. abstract="false" native="false" synchronized="false"
  30649. static="false" final="false" visibility="public"
  30650. deprecated="not deprecated">
  30651. <param name="taskNumber" type="int"/>
  30652. <param name="taskAttemptNumber" type="int"/>
  30653. <param name="locality" type="int"/>
  30654. <doc>
  30655. <![CDATA[Get a {@link TaskAttemptInfo} with a {@link TaskAttemptID} associated with
  30656. taskType, taskNumber, and taskAttemptNumber. This function considers
  30657. locality, and follows the following decision logic: 1. Make up a
  30658. {@link TaskAttemptInfo} if the task attempt is missing in trace, 2. Make up
  30659. a {@link TaskAttemptInfo} if the task attempt has a KILLED final status in
  30660. trace, 3. If final state is FAILED, construct a {@link TaskAttemptInfo}
  30661. from the trace, without considering locality. 4. If final state is
  30662. SUCCEEDED, construct a {@link TaskAttemptInfo} from the trace, with runtime
  30663. scaled according to locality in simulation and locality in trace.]]>
  30664. </doc>
  30665. </method>
  30666. <doc>
  30667. <![CDATA[{@link ZombieJob} is a layer above {@link LoggedJob} raw JSON objects.
  30668. Each {@link ZombieJob} object represents a job in job history. For everything
  30669. that exists in job history, contents are returned unchanged faithfully. To
  30670. get input splits of a non-existent task, a non-existent task attempt, or an
  30671. ill-formed task attempt, proper objects are made up from statistical
  30672. sketches.]]>
  30673. </doc>
  30674. </class>
  30675. <!-- end class org.apache.hadoop.tools.rumen.ZombieJob -->
  30676. <!-- start class org.apache.hadoop.tools.rumen.ZombieJobProducer -->
  30677. <class name="ZombieJobProducer" extends="java.lang.Object"
  30678. abstract="false"
  30679. static="false" final="false" visibility="public"
  30680. deprecated="not deprecated">
  30681. <implements name="org.apache.hadoop.tools.rumen.JobStoryProducer"/>
  30682. <constructor name="ZombieJobProducer" type="org.apache.hadoop.fs.Path, org.apache.hadoop.tools.rumen.ZombieCluster, org.apache.hadoop.conf.Configuration"
  30683. static="false" final="false" visibility="public"
  30684. deprecated="not deprecated">
  30685. <exception name="IOException" type="java.io.IOException"/>
  30686. <doc>
  30687. <![CDATA[Constructor
  30688. @param path
  30689. Path to the JSON trace file, possibly compressed.
  30690. @param cluster
  30691. The topology of the cluster that corresponds to the jobs in the
  30692. trace. The argument can be null if we do not have knowledge of the
  30693. cluster topology.
  30694. @param conf
  30695. @throws IOException]]>
  30696. </doc>
  30697. </constructor>
  30698. <constructor name="ZombieJobProducer" type="org.apache.hadoop.fs.Path, org.apache.hadoop.tools.rumen.ZombieCluster, org.apache.hadoop.conf.Configuration, long"
  30699. static="false" final="false" visibility="public"
  30700. deprecated="not deprecated">
  30701. <exception name="IOException" type="java.io.IOException"/>
  30702. <doc>
  30703. <![CDATA[Constructor
  30704. @param path
  30705. Path to the JSON trace file, possibly compressed.
  30706. @param cluster
  30707. The topology of the cluster that corresponds to the jobs in the
  30708. trace. The argument can be null if we do not have knowledge of the
  30709. cluster topology.
  30710. @param conf
  30711. @param randomSeed
  30712. use a deterministic seed.
  30713. @throws IOException]]>
  30714. </doc>
  30715. </constructor>
  30716. <constructor name="ZombieJobProducer" type="java.io.InputStream, org.apache.hadoop.tools.rumen.ZombieCluster"
  30717. static="false" final="false" visibility="public"
  30718. deprecated="not deprecated">
  30719. <exception name="IOException" type="java.io.IOException"/>
  30720. <doc>
  30721. <![CDATA[Constructor
  30722. @param input
  30723. The input stream for the JSON trace.
  30724. @param cluster
  30725. The topology of the cluster that corresponds to the jobs in the
  30726. trace. The argument can be null if we do not have knowledge of the
  30727. cluster topology.
  30728. @throws IOException]]>
  30729. </doc>
  30730. </constructor>
  30731. <constructor name="ZombieJobProducer" type="java.io.InputStream, org.apache.hadoop.tools.rumen.ZombieCluster, long"
  30732. static="false" final="false" visibility="public"
  30733. deprecated="not deprecated">
  30734. <exception name="IOException" type="java.io.IOException"/>
  30735. <doc>
  30736. <![CDATA[Constructor
  30737. @param input
  30738. The input stream for the JSON trace.
  30739. @param cluster
  30740. The topology of the cluster that corresponds to the jobs in the
  30741. trace. The argument can be null if we do not have knowledge of the
  30742. cluster topology.
  30743. @param randomSeed
  30744. use a deterministic seed.
  30745. @throws IOException]]>
  30746. </doc>
  30747. </constructor>
  30748. <method name="getNextJob" return="org.apache.hadoop.tools.rumen.ZombieJob"
  30749. abstract="false" native="false" synchronized="false"
  30750. static="false" final="false" visibility="public"
  30751. deprecated="not deprecated">
  30752. <exception name="IOException" type="java.io.IOException"/>
  30753. </method>
  30754. <method name="close"
  30755. abstract="false" native="false" synchronized="false"
  30756. static="false" final="false" visibility="public"
  30757. deprecated="not deprecated">
  30758. <exception name="IOException" type="java.io.IOException"/>
  30759. </method>
  30760. <doc>
  30761. <![CDATA[Producing {@link JobStory}s from job trace.]]>
  30762. </doc>
  30763. </class>
  30764. <!-- end class org.apache.hadoop.tools.rumen.ZombieJobProducer -->
  30765. </package>
  30766. </api>