@@ -24,7 +24,9 @@ import java.io.FileFilter;
 import java.io.FileOutputStream;
 import java.io.FileReader;
 import java.io.IOException;
+import java.io.InputStreamReader;
 import java.io.PrintWriter;
+import java.util.ArrayList;
 import java.util.HashMap;
 import java.util.Iterator;
 import java.util.Map;
@@ -34,7 +36,12 @@ import java.util.regex.Pattern;
 
 import org.apache.commons.logging.Log;
 import org.apache.commons.logging.LogFactory;
+import org.apache.hadoop.fs.FSDataInputStream;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
 import org.apache.hadoop.util.StringUtils;
+
 /**
  * Provides methods for writing to and reading from job history.
  * Job History works in an append mode, JobHistory and its inner classes provide methods
@@ -60,13 +67,14 @@ public class JobHistory {
   private static final String VALUE = "[[^\"]?]+"; // anything but a " in ""
 
   private static final Pattern pattern = Pattern.compile(KEY + "=" + "\"" + VALUE + "\"");
+  private static final int MAX_FILENAME_SIZE = 255;
 
-  public static final String JOBTRACKER_START_TIME = String.valueOf(System.currentTimeMillis());
-  private static final String LOG_DIR = System.getProperty("hadoop.log.dir") + File.separator + "history";
-  public static final String MASTER_INDEX_LOG_FILE = "JobHistory.log";
-
-  private static PrintWriter masterIndex = null;
-  private static Map<String, PrintWriter> openJobs = new HashMap<String, PrintWriter>();
+  public static final String JOBTRACKER_START_TIME =
+    String.valueOf(System.currentTimeMillis());
+  private static String JOBTRACKER_UNIQUE_STRING = null;
+  private static String LOG_DIR = null;
+  private static Map<String, ArrayList<PrintWriter>> openJobs =
+    new HashMap<String, ArrayList<PrintWriter>>();
   private static boolean disableHistory = false;
   /**
    * Record types are identifiers for each line of log in history files.
@@ -101,27 +109,23 @@ public class JobHistory {
   // temp buffer for parsed data
   private static Map<Keys,String> parseBuffer = new HashMap<Keys, String>();
 
-  // init log files
-  static { init(); }
-
   /**
    * Initialize JobHistory files.
    *
    */
-  private static void init(){
+  public static void init(JobConf conf, String hostname){
     if (!disableHistory){
       try{
-        File logDir = new File(LOG_DIR);
-        if (!logDir.exists()){
-          if (!logDir.mkdirs()){
+        LOG_DIR = conf.get("hadoop.job.history.location");
+        JOBTRACKER_UNIQUE_STRING = hostname + "_" +
+          JOBTRACKER_START_TIME + "_";
+        Path logDir = new Path(LOG_DIR);
+        FileSystem fs = logDir.getFileSystem(conf);
+        if (!fs.exists(logDir)){
+          if (!fs.mkdirs(logDir)){
             throw new IOException("Mkdirs failed to create " + logDir.toString());
           }
         }
-      masterIndex = 
-        new PrintWriter(
-          new FileOutputStream(new File(LOG_DIR + File.separator + MASTER_INDEX_LOG_FILE), true));
-      // add jobtracker id = tracker start time
-      log(masterIndex, RecordTypes.Jobtracker, Keys.START_TIME, JOBTRACKER_START_TIME);
       }catch(IOException e){
         LOG.error("Failed to initialize JobHistory log file", e);
         disableHistory = true;
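
With this change, init() no longer runs from a static block; the JobTracker must call it explicitly with a JobConf, and the history directory is resolved through the FileSystem API, so `hadoop.job.history.location` may point at any supported filesystem. A minimal sketch of the new call site, assuming a hypothetical hostname and history URI (neither appears in the patch):

```java
// Sketch only: the URI and hostname are illustrative assumptions.
JobConf conf = new JobConf();
conf.set("hadoop.job.history.location", "hdfs://namenode:9000/mapred/history");
JobHistory.init(conf, "jobtracker.example.com");  // creates the dir if absent
```
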
@@ -129,17 +133,19 @@ public class JobHistory {
       }
     }
 
-  
   /**
-   * Parses history file and invokes Listener.handle() for each line of history. It can 
-   * be used for looking through history files for specific items without having to keep 
-   * whlole history in memory. 
+   * Parses history file and invokes Listener.handle() for
+   * each line of history. It can be used for looking through history
+   * files for specific items without having to keep whole history in memory.
    * @param path path to history file
    * @param l Listener for history events
+   * @param fs FileSystem where history file is present
    * @throws IOException
    */
-  public static void parseHistory(File path, Listener l) throws IOException{
-    BufferedReader reader = new BufferedReader(new FileReader(path));
+  public static void parseHistoryFromFS(String path, Listener l, FileSystem fs)
+  throws IOException{
+    FSDataInputStream in = fs.open(new Path(path));
+    BufferedReader reader = new BufferedReader(new InputStreamReader(in));
     try {
      String line = null; 
      StringBuffer buf = new StringBuffer(); 
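
Since the reader now comes from fs.open(), history files can be scanned wherever they were written, not just on the local disk. A usage sketch, assuming the Listener callback declared elsewhere in this class keeps a handle(RecordTypes, Map<Keys,String>) shape; the path and conf are illustrative:

```java
// Sketch: print the job id of each Job record in one history file.
FileSystem fs = FileSystem.get(conf);
JobHistory.parseHistoryFromFS("/mapred/history/somejobfile",
    new JobHistory.Listener() {
      public void handle(JobHistory.RecordTypes recType,
                         Map<JobHistory.Keys, String> values)
          throws IOException {
        if (recType == JobHistory.RecordTypes.Job) {
          System.out.println("Job record: "
              + values.get(JobHistory.Keys.JOBID));
        }
      }
    }, fs);
```
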
@@ -155,6 +161,7 @@ public class JobHistory {
       try { reader.close(); } catch (IOException ex) {}
     }
   }
+  
   /**
    * Parse a single line of history.
    * @param line
@@ -203,8 +210,8 @@ public class JobHistory {
    * @param values type of log event
    */
 
-  static void log(PrintWriter out, RecordTypes recordType, Keys[] keys, 
-                  String[] values){
+  static void log(ArrayList<PrintWriter> writers, RecordTypes recordType,
+                  Keys[] keys, String[] values) {
     StringBuffer buf = new StringBuffer(recordType.name());
     buf.append(DELIMITER);
     for(int i =0; i< keys.length; i++){
@@ -215,8 +222,10 @@ public class JobHistory {
       buf.append(DELIMITER);
     }
 
-    out.println(buf.toString());
-    out.flush();
+    for (PrintWriter out : writers) {
+      out.println(buf.toString());
+      out.flush();
+    }
   }
 
   /**
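
The log() overload above writes the identical record line to every open writer and flushes each one, which is what keeps the copy under hadoop.job.history.location and the user-requested copy in sync. A standalone sketch of that contract, with StringWriters standing in for the real output streams (nothing here is part of the patch):

```java
import java.io.PrintWriter;
import java.io.StringWriter;
import java.util.ArrayList;

public class FanOutSketch {
  public static void main(String[] args) {
    StringWriter a = new StringWriter();
    StringWriter b = new StringWriter();
    ArrayList<PrintWriter> writers = new ArrayList<PrintWriter>();
    writers.add(new PrintWriter(a));
    writers.add(new PrintWriter(b));
    // Same loop shape as the patched log(): fan out, then flush per record
    // so a reader never sees a partially written line.
    String record = "Job JOBID=\"job_0001\" SUBMIT_TIME=\"1190000000000\" .";
    for (PrintWriter out : writers) {
      out.println(record);
      out.flush();
    }
    System.out.println(a.toString().equals(b.toString()));  // prints true
  }
}
```
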
@@ -331,7 +340,8 @@ public class JobHistory {
    * @return the path of the job file on the local file system
    */
   public static String getLocalJobFilePath(String jobId){
-    return LOG_DIR + File.separator + jobId + "_conf.xml";
+    return System.getProperty("hadoop.log.dir") + File.separator +
+             jobId + "_conf.xml";
   }
 
   /**
@@ -347,23 +357,63 @@ public class JobHistory {
                                     String jobConfPath, long submitTime) {
       String jobName = jobConf.getJobName();
       String user = jobConf.getUser();
+      FileSystem fs = null;
+      String userLogDir = null;
+      String jobUniqueString = JOBTRACKER_UNIQUE_STRING + jobId;
+
       if (!disableHistory){
-        synchronized(MASTER_INDEX_LOG_FILE){
-          JobHistory.log(masterIndex, RecordTypes.Job, 
-                         new Keys[]{Keys.JOBID, Keys.JOBNAME, Keys.USER, Keys.SUBMIT_TIME, Keys.JOBCONF }, 
-                         new String[]{jobId, jobName, user, 
-                                      String.valueOf(submitTime), jobConfPath}
-                        );
-        }
         // setup the history log file for this job
-        String logFileName = JOBTRACKER_START_TIME + "_" + jobId; 
-        File logFile = new File(LOG_DIR + File.separator + logFileName);
-        
+        String logFileName = jobUniqueString +
+                             "_" + user + "_" + jobName;
+        if (logFileName.length() > MAX_FILENAME_SIZE) {
+          logFileName = logFileName.substring(0, MAX_FILENAME_SIZE-1);
+        }
+
+        // find user log directory
+        Path outputPath = jobConf.getOutputPath();
+        userLogDir = jobConf.get("hadoop.job.history.user.location",
+                                 outputPath == null ? null : outputPath.toString());
+        if ("none".equals(userLogDir)) {
+          userLogDir = null;
+        }
+        if (userLogDir != null) {
+          userLogDir = userLogDir + "/_logs/history";
+        }
+
+        String logFile = null;
+        String userLogFile = null;
+        if (LOG_DIR != null ) {
+          logFile = LOG_DIR + File.separator + logFileName;
+        }
+        if (userLogDir != null ) {
+          userLogFile = userLogDir + File.separator + logFileName;
+        }
+
         try{
-          PrintWriter writer = new PrintWriter(logFile);
-          openJobs.put(logFileName, writer);
-          // add to writer as well 
-          JobHistory.log(writer, RecordTypes.Job, 
+          ArrayList<PrintWriter> writers = new ArrayList<PrintWriter>();
+          FSDataOutputStream out = null;
+          PrintWriter writer = null;
+
+          if (LOG_DIR != null) {
+            // create output stream for logging in hadoop.job.history.location
+            fs = new Path(LOG_DIR).getFileSystem(jobConf);
+            out = fs.create(new Path(logFile), true, 4096);
+            writer = new PrintWriter(out);
+            writers.add(writer);
+          }
+          if (userLogDir != null) {
+            // create output stream for logging
+            // in hadoop.job.history.user.location
+            fs = new Path(userLogDir).getFileSystem(jobConf);
+            out = fs.create(new Path(userLogFile), true, 4096);
+            writer = new PrintWriter(out);
+            writers.add(writer);
+          }
+
+          openJobs.put(jobUniqueString, writers);
+
+          // add to writers as well
+          JobHistory.log(writers, RecordTypes.Job,
                          new Keys[]{Keys.JOBID, Keys.JOBNAME, Keys.USER, Keys.SUBMIT_TIME, Keys.JOBCONF }, 
                          new String[]{jobId, jobName, user, 
                                       String.valueOf(submitTime) , jobConfPath}
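
The per-job file name now embeds the tracker identity plus user and job name, truncated to MAX_FILENAME_SIZE so a long job name cannot exceed common filesystem name limits. Roughly, with illustrative values (the real pieces come from init() and the JobConf):

```java
// Illustrative values only; hostname, start time, user and job name are
// assumptions for the sake of the example.
String jobUniqueString = "jobtracker.example.com" + "_"
    + "1190000000000" + "_" + "job_0001";
String logFileName = jobUniqueString + "_" + "alice" + "_" + "wordcount";
if (logFileName.length() > 255) {                  // MAX_FILENAME_SIZE
  logFileName = logFileName.substring(0, 255 - 1);
}
// -> jobtracker.example.com_1190000000000_job_0001_alice_wordcount
```
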
@@ -374,7 +424,7 @@ public class JobHistory {
           disableHistory = true; 
         }
       }
-      /* Storing the job conf on the local file system */
+      // Always store job conf on local file system 
       String localJobFilePath = JobInfo.getLocalJobFilePath(jobId); 
       File localJobFile = new File(localJobFilePath);
       FileOutputStream jobOut = null;
@@ -393,10 +443,53 @@ public class JobHistory {
            jobOut.close();
          } catch (IOException ie) {
            LOG.info("Failed to close the job configuration file " 
-                     + StringUtils.stringifyException(ie));
+                   + StringUtils.stringifyException(ie));
          }
        }
      }
+
+      /* Storing the job conf on the log dir */
+      Path jobFilePath = null;
+      if (LOG_DIR != null) {
+        jobFilePath = new Path(LOG_DIR + File.separator +
+                               jobUniqueString + "_conf.xml");
+      }
+      Path userJobFilePath = null;
+      if (userLogDir != null) {
+        userJobFilePath = new Path(userLogDir + File.separator +
+                                   jobUniqueString + "_conf.xml");
+      }
+      FSDataOutputStream jobFileOut = null;
+      try {
+        if (LOG_DIR != null) {
+          fs = new Path(LOG_DIR).getFileSystem(jobConf);
+          if (!fs.exists(jobFilePath)) {
+            jobFileOut = fs.create(jobFilePath);
+            jobConf.write(jobFileOut);
+            jobFileOut.close();
+          }
+        }
+        if (userLogDir != null) {
+          fs = new Path(userLogDir).getFileSystem(jobConf);
+          jobFileOut = fs.create(userJobFilePath);
+          jobConf.write(jobFileOut);
+        }
+        if (LOG.isDebugEnabled()) {
+          LOG.debug("Job conf for " + jobId + " stored at "
+                    + jobFilePath + " and " + userJobFilePath);
+        }
+      } catch (IOException ioe) {
+        LOG.error("Failed to store job conf in the history log dir ", ioe);
+      } finally {
+        if (jobFileOut != null) {
+          try {
+            jobFileOut.close();
+          } catch (IOException ie) {
+            LOG.info("Failed to close the job configuration file " 
+                     + StringUtils.stringifyException(ie));
+          }
+        }
+      }
     }
     /**
      * Logs launch time of job. 
@@ -407,16 +500,9 @@ public class JobHistory {
      */
     public static void logStarted(String jobId, long startTime, int totalMaps, int totalReduces){
       if (!disableHistory){
-        synchronized(MASTER_INDEX_LOG_FILE){
-          JobHistory.log(masterIndex, RecordTypes.Job, 
-              new Keys[] {Keys.JOBID, Keys.LAUNCH_TIME, Keys.TOTAL_MAPS, Keys.TOTAL_REDUCES },
-              new String[] {jobId,  String.valueOf(startTime), 
-                            String.valueOf(totalMaps), String.valueOf(totalReduces) }); 
-        }
-
-      String logFileName = JOBTRACKER_START_TIME + "_" + jobId; 
-      PrintWriter writer = openJobs.get(logFileName); 
-
+      String logFileKey = JOBTRACKER_UNIQUE_STRING + jobId; 
+      ArrayList<PrintWriter> writer = openJobs.get(logFileKey); 
+
       if (null != writer){
         JobHistory.log(writer, RecordTypes.Job,
             new Keys[] {Keys.JOBID, Keys.LAUNCH_TIME, Keys.TOTAL_MAPS, Keys.TOTAL_REDUCES },
@@ -439,20 +525,10 @@ public class JobHistory {
                                  int failedMaps, int failedReduces,
                                  Counters counters){
       if (!disableHistory){
-        synchronized(MASTER_INDEX_LOG_FILE){
-          JobHistory.log(masterIndex, RecordTypes.Job,          
-                         new Keys[] {Keys.JOBID, Keys.FINISH_TIME, 
-                                     Keys.JOB_STATUS, Keys.FINISHED_MAPS, 
-                                     Keys.FINISHED_REDUCES},
-                         new String[] {jobId, "" + finishTime, 
-                                       Values.SUCCESS.name(), 
-                                       String.valueOf(finishedMaps), 
-                                       String.valueOf(finishedReduces)});
-        }
-
       // close job file for this job
-      String logFileName = JOBTRACKER_START_TIME + "_" + jobId; 
-      PrintWriter writer = openJobs.get(logFileName); 
+      String logFileKey = JOBTRACKER_UNIQUE_STRING + jobId; 
+      ArrayList<PrintWriter> writer = openJobs.get(logFileKey); 
+
       if (null != writer){
         JobHistory.log(writer, RecordTypes.Job,          
                        new Keys[] {Keys.JOBID, Keys.FINISH_TIME, 
@@ -467,8 +543,10 @@ public class JobHistory {
                                      String.valueOf(failedMaps), 
                                      String.valueOf(failedReduces),
                                      counters.makeCompactString()});
-        writer.close();
-        openJobs.remove(logFileName);
+        for (PrintWriter out : writer) {
+          out.close();
+        }
+        openJobs.remove(logFileKey);
       }
       Thread historyCleaner = new Thread(new HistoryCleaner());
       historyCleaner.start();
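
Job completion now closes every writer in the fan-out list before dropping the openJobs entry; the key mirrors the one built in logSubmitted. The lifecycle, reduced to a sketch (names mirror the patch, but the map is private to JobHistory, so this is illustrative rather than callable as written):

```java
// Sketch of the openJobs bookkeeping shared by logFinished/logFailed.
String logFileKey = JOBTRACKER_UNIQUE_STRING + jobId;  // same key as logSubmitted
ArrayList<PrintWriter> writers = openJobs.get(logFileKey);
if (writers != null) {
  for (PrintWriter out : writers) {
    out.close();               // releases both history copies
  }
  openJobs.remove(logFileKey); // later log calls for this job become no-ops
}
```
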
@@ -483,21 +561,18 @@ public class JobHistory {
      */
     public static void logFailed(String jobid, long timestamp, int finishedMaps, int finishedReduces){
       if (!disableHistory){
-        synchronized(MASTER_INDEX_LOG_FILE){
-          JobHistory.log(masterIndex, RecordTypes.Job,
-                         new Keys[] {Keys.JOBID, Keys.FINISH_TIME, Keys.JOB_STATUS, Keys.FINISHED_MAPS, Keys.FINISHED_REDUCES },
-                         new String[] {jobid, String.valueOf(timestamp), Values.FAILED.name(), String.valueOf(finishedMaps), 
-                                       String.valueOf(finishedReduces)});
-        }
-      String logFileName = JOBTRACKER_START_TIME + "_" + jobid; 
-      PrintWriter writer = openJobs.get(logFileName); 
+      String logFileKey = JOBTRACKER_UNIQUE_STRING + jobid; 
+      ArrayList<PrintWriter> writer = openJobs.get(logFileKey); 
+
       if (null != writer){
         JobHistory.log(writer, RecordTypes.Job,
                        new Keys[] {Keys.JOBID, Keys.FINISH_TIME, Keys.JOB_STATUS, Keys.FINISHED_MAPS, Keys.FINISHED_REDUCES },
                        new String[] {jobid, String.valueOf(timestamp), Values.FAILED.name(), String.valueOf(finishedMaps), 
                                      String.valueOf(finishedReduces)});
-      writer.close();
-      openJobs.remove(logFileName);
+        for (PrintWriter out : writer) {
+          out.close();
+        }
+        openJobs.remove(logFileKey);
       }
     }
   }
@@ -520,7 +595,9 @@ public class JobHistory {
     public static void logStarted(String jobId, String taskId, String taskType, 
                                   long startTime){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.Task, 
                          new Keys[]{Keys.TASKID, Keys.TASK_TYPE , Keys.START_TIME},
@@ -538,7 +615,9 @@ public class JobHistory {
     public static void logFinished(String jobId, String taskId, String taskType, 
                                    long finishTime, Counters counters){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.Task, 
                          new Keys[]{Keys.TASKID, Keys.TASK_TYPE,
@@ -560,7 +639,9 @@ public class JobHistory {
      */
     public static void logFailed(String jobId, String taskId, String taskType, long time, String error){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.Task, 
                          new Keys[]{Keys.TASKID, Keys.TASK_TYPE,
@@ -597,7 +678,9 @@ public class JobHistory {
      */
     public static void logStarted(String jobId, String taskId, String taskAttemptId, long startTime, String hostName){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.MapAttempt, 
                          new Keys[]{ Keys.TASK_TYPE, Keys.TASKID,
@@ -620,7 +703,9 @@ public class JobHistory {
                                    String taskAttemptId, long finishTime, 
                                    String hostName){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.MapAttempt, 
                          new Keys[]{ Keys.TASK_TYPE, Keys.TASKID,
@@ -644,7 +729,9 @@ public class JobHistory {
     public static void logFailed(String jobId, String taskId, String taskAttemptId, 
                                  long timestamp, String hostName, String error){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.MapAttempt, 
                          new Keys[]{Keys.TASK_TYPE, Keys.TASKID, Keys.TASK_ATTEMPT_ID, Keys.TASK_STATUS,
@@ -666,7 +753,9 @@ public class JobHistory {
     public static void logKilled(String jobId, String taskId, String taskAttemptId, 
                                  long timestamp, String hostName, String error){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.MapAttempt, 
                          new Keys[]{Keys.TASK_TYPE, Keys.TASKID, Keys.TASK_ATTEMPT_ID, Keys.TASK_STATUS,
@@ -693,7 +782,9 @@ public class JobHistory {
     public static void logStarted(String jobId, String taskId, String taskAttemptId, 
                                   long startTime, String hostName){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.ReduceAttempt, 
                          new Keys[]{ Keys.TASK_TYPE, Keys.TASKID,
@@ -718,7 +809,9 @@ public class JobHistory {
                                    long sortFinished, long finishTime, 
                                    String hostName){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.ReduceAttempt, 
                          new Keys[]{ Keys.TASK_TYPE, Keys.TASKID,
@@ -743,7 +836,9 @@ public class JobHistory {
     public static void logFailed(String jobId, String taskId, String taskAttemptId, long timestamp, 
                                  String hostName, String error){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.ReduceAttempt, 
                          new Keys[]{ Keys.TASK_TYPE, Keys.TASKID, Keys.TASK_ATTEMPT_ID, Keys.TASK_STATUS,
@@ -765,7 +860,9 @@ public class JobHistory {
     public static void logKilled(String jobId, String taskId, String taskAttemptId, long timestamp, 
                                  String hostName, String error){
       if (!disableHistory){
-        PrintWriter writer = openJobs.get(JOBTRACKER_START_TIME + "_" + jobId); 
+        ArrayList<PrintWriter> writer = openJobs.get(JOBTRACKER_UNIQUE_STRING
+                                                     + jobId);
+
         if (null != writer){
           JobHistory.log(writer, RecordTypes.ReduceAttempt, 
                          new Keys[]{ Keys.TASK_TYPE, Keys.TASKID,
@@ -822,61 +919,6 @@ public class JobHistory {
       }
       lastRan = now;
       isRunning = true;
-      // update master Index first
-      try{
-        File logFile = new File(
-                                LOG_DIR + File.separator + MASTER_INDEX_LOG_FILE);
-
-        synchronized(MASTER_INDEX_LOG_FILE){
-          Map<String, Map<String, JobHistory.JobInfo>> jobTrackersToJobs = 
-            DefaultJobHistoryParser.parseMasterIndex(logFile);
-
-          // find job that started more than one month back and remove them
-          // for jobtracker instances which dont have a job in past one month 
-          // remove the jobtracker start timestamp as well. 
-          Iterator<Map<String, JobHistory.JobInfo>> jobTrackerItr = 
-            jobTrackersToJobs.values().iterator();
-          while (jobTrackerItr.hasNext()) {
-            Map<String, JobHistory.JobInfo> jobs = jobTrackerItr.next();
-            Iterator<Map.Entry<String, JobHistory.JobInfo>> jobItr = 
-              jobs.entrySet().iterator();
-            while (jobItr.hasNext()) {
-              Map.Entry<String, JobHistory.JobInfo> item = jobItr.next();
-              if (now - item.getValue().getLong(Keys.SUBMIT_TIME) > 
-                  THIRTY_DAYS_IN_MS) {
-                jobItr.remove();
-              }
-            }
-            if (jobs.size() == 0){
-              jobTrackerItr.remove();
-            }
-          }
-          masterIndex.close();
-          masterIndex = new PrintWriter(logFile);
-          // delete old history and write back to a new file 
-          for (Map.Entry<String, Map<String, JobHistory.JobInfo>> entry : 
-                jobTrackersToJobs.entrySet()) {
-            String jobTrackerId = entry.getKey();
-            Map<String, JobHistory.JobInfo> jobs = entry.getValue();
-
-
-            log(masterIndex, RecordTypes.Jobtracker, Keys.START_TIME, jobTrackerId);
-
-            for(JobHistory.JobInfo job : jobs.values()){
-              Map<Keys, String> values = job.getValues();
-
-              log(masterIndex, RecordTypes.Job, 
-                  values.keySet().toArray(new Keys[0]), 
-                  values.values().toArray(new String[0]));
-
-            }
-            masterIndex.flush();
-          }
-        }
-      }catch(IOException e){
-        LOG.error("Failed loading history log for cleanup", e);
-      }
-
       File[] oldFiles = new File(LOG_DIR).listFiles(new FileFilter(){
           public boolean accept(File file){
             // delete if older than 30 days
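
The section ends inside the FileFilter that prunes old history; with the master-index bookkeeping removed above, cleanup becomes purely age-based. A sketch of how the accept() check plausibly completes, assuming it compares file modification time against the THIRTY_DAYS_IN_MS constant referenced in the removed block (the full body is not shown in this excerpt):

```java
// Assumed shape of the age check; `now` is set earlier in run().
public boolean accept(File file) {
  // delete if older than 30 days
  return now - file.lastModified() > THIRTY_DAYS_IN_MS;
}
```
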