
Preparing for release 0.22.0

git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/branches/branch-0.22@1207774 13f79535-47bb-0310-9956-ffa450edef68
Konstantin Shvachko 13 years ago
parent
commit
4956a0d17e
7 changed files with 4832 additions and 7 deletions
  1. common/CHANGES.txt (+13 -1)
  2. common/build.xml (+1 -1)
  3. common/src/docs/releasenotes.html (+4790 -1)
  4. hdfs/CHANGES.txt (+13 -1)
  5. hdfs/build.xml (+1 -1)
  6. mapreduce/CHANGES.txt (+13 -1)
  7. mapreduce/build.xml (+1 -1)

common/CHANGES.txt (+13 -1)

@@ -1,6 +1,18 @@
 Hadoop Change Log
 
-Release 0.22.0 - Unreleased
+Release 0.22.1 - Unreleased
+
+  INCOMPATIBLE CHANGES
+
+  NEW FEATURES
+
+  IMPROVEMENTS
+
+  OPTIMIZATIONS
+
+  BUG FIXES
+
+Release 0.22.0 - 2011-11-29
 
   INCOMPATIBLE CHANGES
 

common/build.xml (+1 -1)

@@ -28,7 +28,7 @@
  
   <property name="Name" value="Hadoop-common"/>
   <property name="name" value="hadoop-common"/>
-  <property name="version" value="0.22.0-SNAPSHOT"/>
+  <property name="version" value="0.22.0"/>
   <property name="final.name" value="${name}-${version}"/>
   <property name="test.final.name" value="${name}-test-${version}"/>
   <property name="year" value="2009"/>

common/src/docs/releasenotes.html (+4790 -1)

@@ -1 +1,4790 @@
-THIS IS A PLACEHOLDER.  REAL RELEASE NOTES WILL BE ADDED TO THIS FILE IN RELEASE BRANCHES.
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN">
+<html>
+<head>
+<META http-equiv="Content-Type" content="text/html; charset=UTF-8">
+<title>Hadoop 0.22.0 Release Notes</title>
+<STYLE type="text/css">
+    H1 {font-family: sans-serif}
+    H2 {font-family: sans-serif; margin-left: 7mm}
+    TABLE {margin-left: 7mm}
+  </STYLE>
+</head>
+
+<body>
+<h1>Hadoop 0.22.0 Release Notes</h1>
+    These release notes include new developer and user-facing incompatibilities, features, and major improvements. 
+
+<a name="changes"/>
+<h2>Changes since Hadoop 0.21.1</h2>
+<ul>
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7730">HADOOP-7730</a>.
+     Major test reported by cos and fixed by cos (test)<br>
+     <b>Allow TestCLI to be run against a cluster</b><br>
+     <blockquote>Use the same CLI test to test cluster bits (see HDFS-1762 for more info)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7861">HADOOP-7861</a>.
+     Major improvement reported by shv and fixed by shv (documentation)<br>
+     <b>changes2html.pl should generate links to HADOOP, HDFS, and MAPREDUCE jiras</b><br>
+     <blockquote>changes2html.pl correctly generates links to HADOOP jiras only. This hasn't been updated since projects split.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7786">HADOOP-7786</a>.
+     Major improvement reported by eli and fixed by eli <br>
+     <b>Remove HDFS-specific configuration keys defined in FsConfig</b><br>
+     <blockquote>HADOOP-4952 added a couple HDFS-specific configuration values to common (the block size and the replication factor) that conflict with the HDFS values (eg have the wrong defaults, wrong key name), are not used by common or hdfs and should be removed. After removing these I noticed the rest of FsConfig is only used once outside a test, and isn&apos;t tagged as a public API, I think we can remove it entirely.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7783">HADOOP-7783</a>.
+     Major test reported by eli and fixed by eli (fs)<br>
+     <b>Add more symlink tests that cover intermediate links</b><br>
+     <blockquote>This covers the tests for HDFS-2514.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7697">HADOOP-7697</a>.
+     Major bug reported by shv and fixed by shv (build)<br>
+     <b>Remove dependency on different version of slf4j in avro</b><br>
+     <blockquote>Avro upgrade led to a mixture of slf4j versions. Hadoop uses slf4j 1.5.11, and avro brings in 1.6.1</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7663">HADOOP-7663</a>.
+     Major bug reported by mayank_bansal and fixed by mayank_bansal (test)<br>
+     <b>TestHDFSTrash failing on 22</b><br>
+     <blockquote>Seems to have started failing recently in many commit builds as well as the last two nightly builds of 22:
+<br>https://builds.apache.org/hudson/job/Hadoop-Hdfs-22-branch/51/testReport/org.apache.hadoop.hdfs/TestHDFSTrash/testTrashEmptier/
+<br>
+<br>https://issues.apache.org/jira/browse/HDFS-1967</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7646">HADOOP-7646</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (io, ipc)<br>
+     <b>Make hadoop-common use same version of avro as HBase</b><br>
+     <blockquote>HBase depends on avro 1.5.3 whereas hadoop-common depends on 1.3.2.
+<br>When building HBase on top of hadoop, this should be consistent.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7577">HADOOP-7577</a>.
+     Minor bug reported by jrottinghuis and fixed by jrottinghuis (metrics)<br>
+     <b>TT does not start due to backwards compatibility wrt. EventCounter</b><br>
+     <blockquote>Between metrics1 and mertrics2 EventCounter was moved from o.a.h.log to o.a.h.metrics.jvm.
+<br>On 0.20-security a wrapper marked with @Deprecated was added back to o.a.h.log for compatibility, the same wrapper exists on trunk, but no on 0.22.
+<br>
+<br>Without it the TT will fail to start with a ClassNotFoundException.
+<br>Hive configuration also point to this class in the log4j.properties.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7568">HADOOP-7568</a>.
+     Major bug reported by shv and fixed by zero45 (io)<br>
+     <b>SequenceFile should not print into stdout</b><br>
+     <blockquote>The following line in {{SequenceFile.Reader.initialize()}} should be removed:
+<br>System.out.println(&quot;Setting end to &quot; + end);
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7514">HADOOP-7514</a>.
+     Minor bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Build fails with ClassCastException when running both mvn-install and mvn-deploy targets</b><br>
+     <blockquote>Although this may not be a common use-case, the exception thrown is really confusing and does not clarify what the problem is.
+<br>The resulting error is: java.lang.ClassCastException: org.codehaus.plexus.DefaultPlexusContainer cannot be cast to org.codehaus.plexus.PlexusContainer
+<br>The error occurs because mvn-init target gets called twice.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7513">HADOOP-7513</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>mvn-deploy target fails</b><br>
+     <blockquote>When executing mvn-deploy target, the build fails.
+<br>hadoop-common and hadoop-common-sources deploy, but the test jar does not.
+<br>
+<br>property staging is not set and/or set to false, meaning when you try to deploy a snapshot build.
+<br>
+<br>The error reads:
+<br>Invalid reference: &apos;hadoop.core.test&apos;.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7457">HADOOP-7457</a>.
+     Blocker improvement reported by jghoman and fixed by jghoman (documentation)<br>
+     <b>Remove out-of-date Chinese language documentation</b><br>
+     <blockquote>The Chinese language documentation haven&apos;t been updated (other than copyright years and svn moves) since their original contribution several years ago.  Worse than no docs is out-of-date, wrong docs.  We should delete them from the source tree.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7450">HADOOP-7450</a>.
+     Blocker bug reported by jnp and fixed by cos (build)<br>
+     <b>Bump jetty to 6.1.26</b><br>
+     <blockquote>Bump the jetty version, as previous version has an issue that can cause it to hang at startup.
+<br>
+<br>6.1.14 jetty is also tends to hung on heavy datanode loads.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7390">HADOOP-7390</a>.
+     Minor bug reported by tgraves and fixed by tlipcon (build)<br>
+     <b>VersionInfo not generated properly in git after unsplit</b><br>
+     <blockquote>The version information generated during the build of common when running from git has revision and branch Unknown. I believe this started after the unsplit:
+<br>
+<br>@HadoopVersionAnnotation(version=&quot;0.22.0-SNAPSHOT&quot;, revision=&quot;Unknown&quot;, branch=&quot;Unknown&quot;,
+<br>                         user=&quot;tgraves&quot;, date=&quot;Tue Jun 14 13:39:10 UTC 2011&quot;, url=&quot;file:///home/tgraves/git/hadoop-common/common&quot;,
+<br>                         srcChecksum=&quot;0f78ea668971fe51e7ebf4f97f84eed2&quot;)
+<br>
+<br>The ./src/saveVersion.sh script which generates the package-info.java file with the version info looks for the presence of .git directory and that is now a level up instead of in the common directory.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7358">HADOOP-7358</a>.
+     Minor improvement reported by tlipcon and fixed by tlipcon (ipc)<br>
+     <b>Improve log levels when exceptions caught in RPC handler</b><br>
+     <blockquote>When a server implementation throws an exception handling an RPC, the Handler thread catches it and logs it before responding with the exception over the IPC channel. This is currently done at INFO level.
+<br>
+<br>I&apos;d like to propose that, if the exception is an unchecked exception, it should be logged at WARN level instead. This can help alert operators when they might be hitting some kind of bug.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7355">HADOOP-7355</a>.
+     Major improvement reported by stack and fixed by stack <br>
+     <b>Add audience and stability annotations to HttpServer class</b><br>
+     <blockquote>HttpServer has at least one subclasser in HBase.  Flag this class w/ annotations that make this plain so we avoid regressions like HADOOP-7351</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7351">HADOOP-7351</a>.
+     Major bug reported by stack and fixed by stack <br>
+     <b>Regression: HttpServer#getWebAppsPath used to be protected so subclasses could supply alternate webapps path but it was made private by HADOOP-6461</b><br>
+     <blockquote>It USED to be protected rather than private but its access was changed by HADOOP-6461.  It did the following:
+<br>
+<br>-  protected String getWebAppsPath() throws IOException {
+<br>-    URL url = getClass().getClassLoader().getResource(&quot;webapps&quot;);
+<br>+  private String getWebAppsPath(String appName) throws FileNotFoundException {
+<br>+    URL url = getClass().getClassLoader().getResource(&quot;webapps/&quot; + appName);
+<br>...
+<br>
+<br>HBase subclasses HttpServer providing its UI.  This change makes it so we can no longer do so.
+<br>
+<br>This change made it into 0.21.  I&apos;d like to get a fix committed to 0.22 as well as TRUNK.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7349">HADOOP-7349</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (ipc, test)<br>
+     <b>HADOOP-7121 accidentally disabled some tests</b><br>
+     <blockquote>When I converted TestIPC to JUnit 4, I missed a couple of tests towards the bottom of the file when adding the @Test annotation.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7346">HADOOP-7346</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (ipc)<br>
+     <b>Send back nicer error to clients using outdated IPC version</b><br>
+     <blockquote>When an older Hadoop version tries to contact a newer Hadoop version across an IPC protocol version bump, the client currently just gets a non-useful error message like &quot;EOFException&quot;.
+<br>
+<br>Instead, the IPC server code can speak just enough of prior IPC protocols to send back a &quot;fatal&quot; message indicating the version mismatch.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7335">HADOOP-7335</a>.
+     Minor improvement reported by tlipcon and fixed by tlipcon (build, test)<br>
+     <b>Force entropy to come from non-true random for tests</b><br>
+     <blockquote>Passing the system property {{-Djava.security.egd=file:///dev/urandom}} forces the JVM to seed its PRNG from non-true random (/dev/urandom) instead of the true random (/dev/random). This makes the tests run faster, since without it they often hang waiting for entropy while Jetty is initializing.
+<br>
+<br>We should turn this on for the test targets by default, so developers/hudson boxes don&apos;t have to make this change system-wide or use workarounds like rngtools.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7325">HADOOP-7325</a>.
+     Minor improvement reported by brocknoland and fixed by brocknoland (scripts)<br>
+     <b>hadoop command - do not accept class names starting with a hyphen</b><br>
+     <blockquote>
+The hadoop command does not appear to advertise allowing JVM options before the classname.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7318">HADOOP-7318</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (io)<br>
+     <b>MD5Hash factory should reset the digester it returns</b><br>
+     <blockquote>Currently the getDigest() method in MD5Hash does not reset the digester it returns. Since it&apos;s a thread-local, this means that a previous aborted usage of the same digester could leave some state around. For example, if the secondary namenode receives an IOException while transfering the image, and does another image transfer with the same thread, it will think it has received an invalid digest.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7312">HADOOP-7312</a>.
+     Minor bug reported by tlipcon and fixed by qwertymaniac (conf)<br>
+     <b>core-default.xml lists configuration version as 0.21</b><br>
+     <blockquote>This key was added in HADOOP-6233, though appears unused. I suppose it&apos;s somewhat useful to try to diagnose if someone has old versions of core-default.xml on the classpath.
+<br>
+<br>Either way it should probably be updated to say 0.22 in the branch and 0.23 in trunk.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7302">HADOOP-7302</a>.
+     Major bug reported by asrabkin and fixed by asrabkin (documentation)<br>
+     <b>webinterface.private.actions should not be in common</b><br>
+     <blockquote>The comment in -defaults says that webinterface.private.actions applies to both NN and JT. This is wrong. This option is only referenced via the JobTracker. 
+<br>
+<br>I propose to delete it here, and file a second issue in MAPREDUCE for renaming the option (deprecating the existing name.)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7300">HADOOP-7300</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (conf)<br>
+     <b>Configuration methods that return collections are inconsistent about mutability</b><br>
+     <blockquote>In particular, getTrimmedStringCollection seems to return an immutable collection, whereas getStringCollection returns a mutable one.
+<br>
+<br>IMO we should always return mutable collections since these methods by definition are doing copies.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7298">HADOOP-7298</a>.
+     Major test reported by tlipcon and fixed by tlipcon (test)<br>
+     <b>Add test utility for writing multi-threaded tests</b><br>
+     <blockquote>A lot of our tests spawn off multiple threads in order to check various synchronization issues, etc. It&apos;s often tedious to write these kinds of tests because you have to manually propagate exceptions back to the main thread, etc.
+<br>
+<br>In HBase we have developed a testing utility which makes writing these kinds of tests much easier. I&apos;d like to copy that utility into Hadoop so we can use it here as well.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7296">HADOOP-7296</a>.
+     Minor bug reported by sseth and fixed by sseth (fs)<br>
+     <b>The FsPermission(FsPermission) constructor does not use the sticky bit</b><br>
+     <blockquote>The FsPermission(FsPermission) constructor copies u, g, o from the supplied FsPermission object but ignores the sticky bit.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7291">HADOOP-7291</a>.
+     Major task reported by eli and fixed by eli <br>
+     <b>Update Hudson job not to run test-contrib</b><br>
+     <blockquote>The test-contrib target was removed in HADOOP-7137, which causes the Hudson job to fail. The build file doesn&apos;t execute test-contrib so I suspect the Hudson job needs to be updated to not call ant with the test-contrib target.  </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7287">HADOOP-7287</a>.
+     Blocker bug reported by tlipcon and fixed by atm (conf)<br>
+     <b>Configuration deprecation mechanism doesn&apos;t work properly for GenericOptionsParser/Tools</b><br>
+     <blockquote>For example, you can&apos;t use -D options on the &quot;hadoop fs&quot; command line in order to specify the deprecated names of configuration options. The issue is that the ordering is:
+<br>- JVM starts
+<br>- GenericOptionsParser creates a Configuration object and calls set() for each of the options specified on command line
+<br>- DistributedFileSystem or other class eventually instantiates HdfsConfiguration which adds the deprecations
+<br>- Some class calls conf.get(&quot;new key&quot;) and sees the default instead of the version set on the command line</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7283">HADOOP-7283</a>.
+     Blocker task reported by tomwhite and fixed by tomwhite (build)<br>
+     <b>Include 32-bit and 64-bit native libraries in Jenkins tarball builds</b><br>
+     <blockquote>The job at https://builds.apache.org/hudson/view/G-L/view/Hadoop/job/Hadoop-22-Build/ is building tarballs, but they do not currently include both 32-bit and 64-bit native libraries. We should update/duplicate hadoop-nighly/hudsonBuildHadoopRelease.sh to support post-split builds.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7252">HADOOP-7252</a>.
+     Minor bug reported by ponyloky and fixed by qwertymaniac (build, conf, test)<br>
+     <b>JUnit shows up as a compile time dependency</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7245">HADOOP-7245</a>.
+     Major bug reported by tomwhite and fixed by tomwhite <br>
+     <b>FsConfig should use constants in CommonConfigurationKeys</b><br>
+     <blockquote>In particular, FsConfig should use fs.defaultFS instead of the deprecated fs.default.name.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7244">HADOOP-7244</a>.
+     Blocker improvement reported by tomwhite and fixed by tomwhite (documentation)<br>
+     <b>Documentation change for updated configuration keys</b><br>
+     <blockquote>Common counterpart of HDFS-671.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7241">HADOOP-7241</a>.
+     Minor improvement reported by weiyj and fixed by weiyj (fs, test)<br>
+     <b>fix typo of command &apos;hadoop fs -help tail&apos;</b><br>
+     <blockquote>Fix the typo of command &apos;hadoop fs -help tail&apos;.
+<br>
+<br>$ hadoop fs -help tail
+<br>-tail [-f] &lt;file&gt;:  Show the last 1KB of the file. 
+<br>    The -f option shows apended data as the file grows. 
+<br>
+<br>The &quot;apended data&quot; should be &quot;appended data&quot;.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7229">HADOOP-7229</a>.
+     Major bug reported by atm and fixed by atm (security)<br>
+     <b>Absolute path to kinit in auto-renewal thread</b><br>
+     <blockquote>In the auto-renewal thread for Kerberos credentials in {{UserGroupInformation}}, the path to {{kinit}} is defaulted to {{/usr/kerberos/bin/kinit}}. This is the default path to {{kinit}} on RHEL/CentOS for MIT krb5, but not on Debian/Ubuntu (and perhaps others OSes.)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7192">HADOOP-7192</a>.
+     Trivial improvement reported by qwertymaniac and fixed by qwertymaniac (documentation)<br>
+     <b>fs -stat docs aren&apos;t updated to reflect the format features</b><br>
+     <blockquote>The html docs of the &apos;fs -stat&apos; command (that is found listed in the File System Shell Guide), does not seem to have the formatting abilities of -stat explained (along with the options).
+<br>
+<br>Like &apos;fs -help&apos;, the docs must also reflect the latest available features.
+<br>
+<br>I shall attach a doc-fix patch shortly.
+<br>
+<br>If anyone has other discrepancies to point out in the web version of the guide, please do so :)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7189">HADOOP-7189</a>.
+     Minor improvement reported by tlipcon and fixed by yuzhihong@gmail.com (security)<br>
+     <b>Add ability to enable &apos;debug&apos; property in JAAS configuration</b><br>
+     <blockquote>Occasionally users have run into weird &quot;Unable to login&quot; messages. Unfortunately, JAAS obscures the underlying exception message in many cases because it thinks leaking the exception might be insecure in itself. Enabling the &quot;debug&quot; option in the JAAS configuration gets it to dump the underlying issue and makes troubleshooting this kind of issue easier.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7187">HADOOP-7187</a>.
+     Major bug reported by umamaheswararao and fixed by umamaheswararao (metrics)<br>
+     <b>Socket Leak in org.apache.hadoop.metrics.ganglia.GangliaContext</b><br>
+     <blockquote>Init method is creating DatagramSocket. But this is not closed any where. 
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7184">HADOOP-7184</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (documentation, filecache)<br>
+     <b>Remove deprecated local.cache.size from core-default.xml</b><br>
+     <blockquote>MAPREDUCE-2379 documents the new name of this parameter (mapreduce.tasktracker.cache.local.size) in mapred-default.xml where it belongs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7172">HADOOP-7172</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (io, security)<br>
+     <b>SecureIO should not check owner on non-secure clusters that have no native support</b><br>
+     <blockquote>The SecureIOUtils.openForRead function currently uses a racy stat/open combo if security is disabled and the native libraries are not available. This ends up shelling out to &quot;ls -ld&quot; which is very very slow. We&apos;ve seen this cause significant performance regressions on clusters that match this profile.
+<br>
+<br>Since the racy permissions check doesn&apos;t buy us any security anyway, we should just fall back to a normal &quot;open&quot; without any stat() at all, if we can&apos;t use the native support to do it efficiently.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7156">HADOOP-7156</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon <br>
+     <b>getpwuid_r is not thread-safe on RHEL6</b><br>
+     <blockquote>Due to the following bug in SSSD, functions like getpwuid_r are not thread-safe in RHEL 6.0 if sssd is specified in /etc/nsswitch.conf (as it is by default):
+<br>
+<br>https://fedorahosted.org/sssd/ticket/640
+<br>
+<br>This causes many fetch failures in the case that the native libraries are available, since the SecureIO functions call getpwuid_r as part of fstat. By enabling -Xcheck:jni I get the following trace on JVM crash:
+<br>
+<br>*** glibc detected *** /mnt/toolchain/JDK6u20-64bit/bin/java: free(): invalid pointer: 0x0000003575741d23 ***
+<br>======= Backtrace: =========
+<br>/lib64/libc.so.6[0x3575675676]
+<br>/lib64/libnss_sss.so.2(_nss_sss_getpwuid_r+0x11b)[0x7fe716cb42cb]
+<br>/lib64/libc.so.6(getpwuid_r+0xdd)[0x35756a5dfd]
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7154">HADOOP-7154</a>.
+     Minor improvement reported by tlipcon and fixed by tlipcon (scripts)<br>
+     <b>Should set MALLOC_ARENA_MAX in hadoop-env.sh</b><br>
+     <blockquote>New versions of glibc present in RHEL6 include a new arena allocator design. In several clusters we&apos;ve seen this new allocator cause huge amounts of virtual memory to be used, since when multiple threads perform allocations, they each get their own memory arena. On a 64-bit system, these arenas are 64M mappings, and the maximum number of arenas is 8 times the number of cores. We&apos;ve observed a DN process using 14GB of vmem for only 300M of resident set. This causes all kinds of nasty issues for obvious reasons.
+<br>
+<br>Setting MALLOC_ARENA_MAX to a low number will restrict the number of memory arenas and bound the virtual memory, with no noticeable downside in performance - we&apos;ve been recommending MALLOC_ARENA_MAX=4. We should set this in hadoop-env.sh to avoid this issue as RHEL6 becomes more and more common.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7146">HADOOP-7146</a>.
+     Major bug reported by tlipcon and fixed by tlipcon <br>
+     <b>RPC server leaks file descriptors</b><br>
+     <blockquote>Both the Listener and Responder thread call Selector.open but don&apos;t have a matching .close(). This causes a leak of anonymous pipes. Not a big deal because people rarely close and re-open servers, but worth fixing.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7145">HADOOP-7145</a>.
+     Major bug reported by tlipcon and fixed by tlipcon <br>
+     <b>Configuration.getLocalPath should trim whitespace from the provided directories</b><br>
+     <blockquote>MR and HDFS use the Configuration.getTrimmedStrings API for local directory lists, but in a few places also use Configuration.getLocalPath. The former API trims whitespace around each entry in the list, but the latter doesn&apos;t. This can cause some subtle problems - the latter API should be fixed to also trim the directory names.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7140">HADOOP-7140</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon <br>
+     <b>IPC Reader threads do not stop when server stops</b><br>
+     <blockquote>After HADOOP-6713, the new IPC &quot;Reader&quot; threads are not properly stopped when the server shuts down. One repercussion of this is that conditions that are supposed to shut down a daemon no longer work (eg the TT doesn&apos;t shut itself down if it detects an incompatible build version)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7137">HADOOP-7137</a>.
+     Major task reported by nidaley and fixed by nidaley <br>
+     <b>Remove hod contrib</b><br>
+     <blockquote>As per vote on general@ (http://mail-archives.apache.org/mod_mbox/hadoop-general/201102.mbox/%3CAC35A7EF-1D68-4055-8D47-EDA2FCF8C2F6@mac.com%3E) I will 
+<br>svn remove common/trunk/src/contrib/hod
+<br>using this Jira.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7134">HADOOP-7134</a>.
+     Major improvement reported by rvs and fixed by rvs (build)<br>
+     <b>configure files that are generated as part of the released tarball need to have executable bit set</b><br>
+     <blockquote>Currently the configure files that are packaged in a tarball are -rw-rw-r--</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7126">HADOOP-7126</a>.
+     Major bug reported by pocheung and fixed by pocheung <br>
+     <b>TestDFSShell fails in trunk</b><br>
+     <blockquote>TestDFSShell.testFilePermissions() fails on an assert in Windows.  This originated from HDFS-1084 but the fix is in Common.
+<br>
+<br>junit.framework.ComparisonFailure: null expected:&lt;rwxr[w----]&gt; but was:&lt;rwxr[-xr-x]&gt;
+<br>  at junit.framework.Assert.assertEquals(Assert.java:81)
+<br>  at junit.framework.Assert.assertEquals(Assert.java:87)
+<br>  at org.apache.hadoop.hdfs.TestDFSShell.confirmPermissionChange(TestDFSShell.java:836)
+<br>  at org.apache.hadoop.hdfs.TestDFSShell.testChmod(TestDFSShell.java:777)
+<br>  at org.apache.hadoop.hdfs.TestDFSShell.testFilePermissions(TestDFSShell.java:856)
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7122">HADOOP-7122</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (util)<br>
+     <b>Timed out shell commands leak Timer threads</b><br>
+     <blockquote>When a shell command times out, the TimerThread used to cause the timeout is leaked.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7121">HADOOP-7121</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (ipc)<br>
+     <b>Exceptions while serializing IPC call response are not handled well</b><br>
+     <blockquote>We had a situation where for some reason the serialization of an RPC call&apos;s response was throwing OOME. When this happens, the exception is not caught, and the call never gets a response - the client just hangs. Additionally, the OOME propagated all the way to the top of the IPC handler and caused the handler. Plus, the Handler upon exit only logged to stdout and not to the log4j logs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7118">HADOOP-7118</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon <br>
+     <b>NPE in Configuration.writeXml</b><br>
+     <blockquote>In HADOOP-7082 I stupidly introduced a regression whereby Configuration.writeXml will throw an NPE if it is called before any .get() call is made, since the properties member is not initialized. This is causing a failure in TestCapacitySchedulerWithJobTracker on my box, but doesn&apos;t appear to trigger any failures in the non-contrib tests since .get() is usually called first.
+<br>
+<br>This JIRA is to fix the bug and add a unit test for writeXml in common (apparently it never had a unit test)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7110">HADOOP-7110</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (io, native)<br>
+     <b>Implement chmod with JNI</b><br>
+     <blockquote>MapReduce is currently using a race-prone workaround to approximate chmod() because forking chmod is too expensive. This race is causing build failures (and probably task failures too). We should implement chmod in the NativeIO library so we can have good performance (ie not fork) and still not be prone to races.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7106">HADOOP-7106</a>.
+     Blocker improvement reported by nidaley and fixed by tlipcon (build)<br>
+     <b>Re-organize hadoop subversion layout</b><br>
+     <blockquote>As discussed on general@ at http://tinyurl.com/4q6lhxm</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7104">HADOOP-7104</a>.
+     Major bug reported by kzhang and fixed by kzhang (ipc, security)<br>
+     <b>Remove unnecessary DNS reverse lookups from RPC layer</b><br>
+     <blockquote>RPC connection authorization needs to verify client&apos;s Kerberos principal name matches what specified for the protocol. For service clients like DN&apos;s, their Kerberos principal names can be specified in the form of  &quot;datanode/_HOST@DOMAIN.COM&quot;. To get the expected
+<br>client principal name, the server needs to substitute &quot;_HOST&quot; with the client&apos;s fully qualified domain name, which requires a reverse DNS lookup from client IP address. However, for connections from clients whose principal name are either unspecified or specified not using the &quot;_HOST&quot; convention, the substitution is not required and the reverse DNS lookup should be avoided. Currently the reverse DNS lookup is done for all clients, which could slow services like NN down, when local named cache is not available.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7102">HADOOP-7102</a>.
+     Major bug reported by shv and fixed by shv (conf)<br>
+     <b>Remove &quot;fs.ramfs.impl&quot; field from core-deafult.xml</b><br>
+     <blockquote>&quot;fs.ramfs.impl&quot; used to be configuration parameter for InMemoryFileSystem, which was deprecated in 0.18 (HADOOP-3501) and removed in 0.21 (HADOOP-4648). Configuration should have been cleaned up at the time.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7101">HADOOP-7101</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (security)<br>
+     <b>UserGroupInformation.getCurrentUser() fails when called from non-Hadoop JAAS context</b><br>
+     <blockquote>If a Hadoop client is run from inside a container like Tomcat, and the current AccessControlContext has a Subject associated with it that is not created by Hadoop, then UserGroupInformation.getCurrentUser() will throw NoSuchElementException, since it assumes that any Subject will have a hadoop User principal.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7100">HADOOP-7100</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (build, contrib/cloud)<br>
+     <b>Build broken by HADOOP-6811</b><br>
+     <blockquote>The commit of HADOOP-6811 removed the ec2 contrib but didn&apos;t update build.xml, which references some of these files from the packaging targets. So, the hudson build is currently broken.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7097">HADOOP-7097</a>.
+     Blocker bug reported by nwatkins and fixed by nwatkins (build, native)<br>
+     <b>java.library.path missing basedir</b><br>
+     <blockquote>My Hadoop installation is  having trouble loading the native code library. It appears from the log below that java.library.path is missing the basedir in its path. The libraries are built, and present in the directory shown below (relative to hadoop-common directory). Instead of seeing:
+<br>
+<br> /build/native/Linux-amd64-64/lib
+<br>
+<br>I would expect to see:
+<br>
+<br> /path/to/hadoop-common/build/native/Linux-amd64-64/lib
+<br>
+<br>I&apos;m working in branch-0.22.
+<br>
+<br>2011-01-10 17:09:27,695 DEBUG org.apache.hadoop.util.NativeCodeLoader: Failed to load native-hadoop with error: java.lang.UnsatisfiedLinkError: no hadoop in java.library.path
+<br>2011-01-10 17:09:27,695 DEBUG org.apache.hadoop.util.NativeCodeLoader: java.library.path=/build/native/Linux-amd64-64/lib
+<br>2011-01-10 17:09:27,695 WARN org.apache.hadoop.util.NativeCodeLoader: Unable to load native-hadoop library for your platform... using builtin-java classes where applicable</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7094">HADOOP-7094</a>.
+     Blocker bug reported by tlipcon and fixed by cos (build)<br>
+     <b>hadoop.css got lost during project split</b><br>
+     <blockquote>hadoop.css no longer exists in common or HDFS, so the web UIs look pretty ugly. The HTML still refers to this file, it&apos;s just gone.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7093">HADOOP-7093</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (io)<br>
+     <b>Servlets should default to text/plain</b><br>
+     <blockquote>In trunk the servlets like /stacks and /metrics are returning text/html content-type instead of text/plain. Security wise it&apos;s much safer to default to text/plain and require servlets to explicitly set the content-type to text/html when required.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7091">HADOOP-7091</a>.
+     Major bug reported by kzhang and fixed by kzhang (security)<br>
+     <b>reloginFromKeytab() should happen even if TGT can&apos;t be found</b><br>
+     <blockquote>HADOOP-6965 introduced a getTGT() method and prevents reloginFromKeytab() from happening when TGT is not found. This results in the RPC layer not being able to refresh TGT after TGT expires. The reason is RPC layer only does relogin when the expired TGT is used and an exception is thrown. However, when that happens, the expired TGT will be removed from Subject. Therefore, getTGT() will return null and relogin will not be performed. We observed, for example, JT will not be able to re-connect to NN after TGT expires.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7089">HADOOP-7089</a>.
+     Minor bug reported by eli and fixed by eli (scripts)<br>
+     <b>Fix link resolution logic in hadoop-config.sh</b><br>
+     <blockquote>The link resolution logic in bin/hadoop-config.sh fails when when executed via a symlink, from the root directory.  We can replace this logic with cd -P and pwd -P, which should be portable across Linux, Solaris, BSD, and OSX. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7087">HADOOP-7087</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (io)<br>
+     <b>SequenceFile.createWriter ignores FileSystem parameter</b><br>
+     <blockquote>The SequenceFile.createWriter methods that take a FileSystem ignore this parameter after HADOOP-6856. This is causing some MR tests to fail and is a breaking change when users pass unqualified paths to these calls.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7082">HADOOP-7082</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (conf)<br>
+     <b>Configuration.writeXML should not hold lock while outputting</b><br>
+     <blockquote>Common side of HDFS-1542</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7070">HADOOP-7070</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (security)<br>
+     <b>JAAS configuration should delegate unknown application names to pre-existing configuration</b><br>
+     <blockquote>As reported here: https://issues.cloudera.org/browse/DISTRO-66 it is impossible to use secured Hadoop inside an application that relies on other JAAS configurations. This is because the static initializer of UserGroupInformation replaces the JAAS configuration, but we don&apos;t delegate unknown applications up to whatever Configuration was installed previously. The delegation technique seems to be used by JBoss&apos;s XMLLoginConfigImpl for example.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7068">HADOOP-7068</a>.
+     Major bug reported by vicaya and fixed by vicaya <br>
+     <b>Ivy resolve force mode should be turned off by default</b><br>
+     <blockquote>The problem is introduced by  HADOOP-6486. Which have caused a lot of mysterious artifact issues (unable to downgrade or do parallel dev, without wiping out both m2 and ivy caches etc.) wasting countless hours of dev (many people&apos;s) time to track down the issue.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7057">HADOOP-7057</a>.
+     Minor bug reported by cos and fixed by cos (util)<br>
+     <b>IOUtils.readFully and IOUtils.skipFully have typo in exception creation&apos;s message</b><br>
+     <blockquote>throw new IOException( &quot;Premeture EOF from inputStream&quot;);
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7054">HADOOP-7054</a>.
+     Major improvement reported by sanjay.radia and fixed by sanjay.radia <br>
+     <b>Change NN LoadGenerator to use the new FileContext api</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7046">HADOOP-7046</a>.
+     Blocker bug reported by nidaley and fixed by pocheung (security)<br>
+     <b>1 Findbugs warning on trunk and branch-0.22</b><br>
+     <blockquote>There is 1 findbugs warnings on trunk. See attached html file. This must be fixed or filtered out to get back to 0 warnings. The OK_FINDBUGS_WARNINGS property in src/test/test-patch.properties should also be set to 0 in the patch that fixes this issue.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7038">HADOOP-7038</a>.
+     Minor bug reported by gnawux and fixed by gnawux (build)<br>
+     <b>saveVersion script includes an additional \r while running whoami under windows</b><br>
+     <blockquote>I built common under windows occasionally, and found it failed because the &apos;user&apos; in build/src/o/a/h/package-info.java is &quot;myhostmyname^M&quot;.
+<br>It seems because the whoami of windows give a string with &apos;\n\r&apos; rather than &apos;\n&apos; only. thus I add an additional tr for it to eliminate the problem.
+<br>Since only windows would generate &apos;\n\r&apos; output, I think it won&apos;t harm to any other platform.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7034">HADOOP-7034</a>.
+     Major test reported by eli and fixed by eli (fs)<br>
+     <b>Add TestPath tests to cover dot, dot dot, and slash normalization</b><br>
+     <blockquote>Add tests for the current path normalization for dot, dot dot, and slash in TestPath (from HDFS-836).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7032">HADOOP-7032</a>.
+     Major improvement reported by eli and fixed by eli (fs)<br>
+     <b>Assert type constraints in the FileStatus constructor</b><br>
+     <blockquote>A FileStatus may represent a file, directory or symlink.  This is indicated using the isdir and symlink members, let&apos;s add an assert that validates the contstraints on these members (eg a directory may not have the symlink member set).  We could also verify this by having more than one constructor but we don&apos;t statically know the type of the file status when we create it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7028">HADOOP-7028</a>.
+     Minor bug reported by patrickangeles and fixed by patrickangeles (build)<br>
+     <b>ant eclipse does not include requisite ant.jar in the classpath</b><br>
+     <blockquote>RccTask imports classes from ant.jar
+<br>Importing the project into Eclipse results in these classes not being found, because ant.jar is not in the classpath.
+<br>Note that this patch requires that ANT_HOME be set, but this is consistent with the documentation as per
+<br>http://wiki.apache.org/hadoop/EclipseEnvironment
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7024">HADOOP-7024</a>.
+     Major test reported by kzhang and fixed by kzhang (test)<br>
+     <b>Create a test method for adding file systems during tests.</b><br>
+     <blockquote>It allows a (mocked) filesystem object to be added to cache for testing purposes. This is used by HDFS-1187.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7013">HADOOP-7013</a>.
+     Major improvement reported by pkling and fixed by pkling <br>
+     <b>Add boolean field isCorrupt to BlockLocation</b><br>
+     <blockquote>This is needed to allow DFSClient.getBlockLocations to notify the calling application when returning a BlockLocation that corresponds to a corrupt block. Currently, this happens when there are no uncorrupted replicas of a requested block.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7011">HADOOP-7011</a>.
+     Major bug reported by atm and fixed by atm <br>
+     <b>KerberosName.main(...) throws NPE</b><br>
+     <blockquote>The main method of KerberosName attempts to do short name translation before calling KerberosName.setConfiguration(...).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7010">HADOOP-7010</a>.
+     Minor improvement reported by yaojingguo and fixed by yaojingguo (fs)<br>
+     <b>Typo in FileSystem.java</b><br>
+     <blockquote>For the Javadoc for getLocal method, &quot;Get the local file syste&quot; should be &quot;Get the local file system.&quot;.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7009">HADOOP-7009</a>.
+     Major improvement reported by hairong and fixed by hairong (io)<br>
+     <b>MD5Hash provides a public factory method that creates an instance of MessageDigest</b><br>
+     <blockquote>MD5Hash has a private way of creating a MessageDigest object that&apos;s thread local. I&apos;d like to have such a method which is public so that checksuming fsimage (HDFS-903) could use it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7008">HADOOP-7008</a>.
+     Major improvement reported by nidaley and fixed by gkesavan (test)<br>
+     <b>Enable test-patch.sh to have a configured number of acceptable findbugs and javadoc warnings</b><br>
+     <blockquote>test-patch.sh should be able to accept a properties file containing an acceptable number of findbugs and javadoc warnings.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7007">HADOOP-7007</a>.
+     Major improvement reported by gkesavan and fixed by gkesavan (build)<br>
+     <b>update the hudson-test-patch target to work with the latest test-patch script.</b><br>
+     <blockquote>The hudson-test-patch target has to be updated to work with the current test-patch.sh script. Since the callback login in the test-patch.sh is removed. by hadoop-7005</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7006">HADOOP-7006</a>.
+     Major bug reported by cnauroth and fixed by cnauroth (fs)<br>
+     <b>hadoop fs -getmerge does not work using codebase from trunk.</b><br>
+     <blockquote>Running the codebase from trunk, the hadoop fs -getmerge command does not work.  As implemented in prior versions (i.e. 0.20.2), I could run hadoop fs -getmerge pointed at a directory containing multiple files.  It would merge all files into a single file on the local file system.  Running the same command using the codebase from trunk, it looks like nothing happens.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7005">HADOOP-7005</a>.
+     Major improvement reported by nidaley and fixed by nidaley (test)<br>
+     <b>Update test-patch.sh to remove callback to Hudson master</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6996">HADOOP-6996</a>.
+     Major new feature reported by hairong and fixed by hairong (io)<br>
+     <b>Allow CodecFactory to return a codec object given a codec&apos; class name</b><br>
+     <blockquote>CodecFactory specify the list of codec that are supported by Hadoop. However, it returns a codec only by a file&apos;s name. I would like to make getCodec method to alternatively take a codec&apos;s class name.
+<br>
+<br>This is required by  HDFS-1435, where
+<br>1. it allows an HDFS admin to configure which codec to use to save an image. 
+<br>2. It stores the codec class name in its on-disk image instead of a file&apos;s suffix.
+<br>
+<br>When saving and reading an image, I&apos;d like to get an codec from CodecFactory by its class name. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6991">HADOOP-6991</a>.
+     Minor bug reported by chris.douglas and fixed by chris.douglas <br>
+     <b>SequenceFile::Reader discards length for files, does not call openFile</b><br>
+     <blockquote>While the sorting and merging in {{SequenceFile}} is deprecated and {{openFile}} is archaic, the semantics should remain consistent.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6989">HADOOP-6989</a>.
+     Major bug reported by jghoman and fixed by chris.douglas <br>
+     <b>TestSetFile is failing on trunk</b><br>
+     <blockquote>Testsuite: org.apache.hadoop.io.TestSetFile
+<br>Tests run: 1, Failures: 0, Errors: 1, Time elapsed: 1.015 sec
+<br>------------- Standard Output ---------------
+<br>2010-10-04 16:32:01,030 INFO  io.TestSetFile (TestSetFile.java:generate(56)) - generating 10000 records in memory
+<br>2010-10-04 16:32:01,249 INFO  io.TestSetFile (TestSetFile.java:generate(63)) - sorting 10000 records
+<br>2010-10-04 16:32:01,350 INFO  io.TestSetFile (TestSetFile.java:writeTest(72)) - creating with 10000 records
+<br>------------- ---------------- ---------------
+<br>
+<br>Testcase: testSetFile took 0.964 sec
+<br>  Caused an ERROR
+<br>key class or comparator option must be set
+<br>java.lang.IllegalArgumentException: key class or comparator option must be set
+<br>  at org.apache.hadoop.io.MapFile$Writer.&lt;init&gt;(MapFile.java:247)
+<br>  at org.apache.hadoop.io.SetFile$Writer.&lt;init&gt;(SetFile.java:60)
+<br>  at org.apache.hadoop.io.TestSetFile.writeTest(TestSetFile.java:73)
+<br>  at org.apache.hadoop.io.TestSetFile.testSetFile(TestSetFile.java:45)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6987">HADOOP-6987</a>.
+     Major improvement reported by jghoman and fixed by jghoman (test)<br>
+     <b>Use JUnit Rule to optionally fail test cases that run more than 10 seconds</b><br>
+     <blockquote>Using JUnit Rules annotations we can fail tests cases that take longer than 10 seconds (for instance) to run.  This provides a regression check against test cases taking longer than they had previously due to unintended code changes, as well as provides a membership criteria for unit tests versus integration tests in HDFS and MR.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6985">HADOOP-6985</a>.
+     Minor improvement reported by rvadali and fixed by rvadali <br>
+     <b>Suggest that HADOOP_OPTS be preserved in hadoop-env.sh.template</b><br>
+     <blockquote>For an administrator who wants to customize HADOOP_OPTS, it would be better to have
+<br>
+<br># if [ &quot;$HADOOP_OPTS&quot; == &quot;&quot; ]; then export HADOOP_OPTS=-server; else FOO+=&quot; -server&quot;; fi
+<br>
+<br>instead of
+<br>
+<br># Extra Java runtime options.  Empty by default.
+<br># export HADOOP_OPTS=-server
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6984">HADOOP-6984</a>.
+     Minor bug reported by chris.douglas and fixed by chris.douglas (io)<br>
+     <b>NPE from SequenceFile::Writer.CompressionCodecOption</b><br>
+     <blockquote>The deprecated HADOOP-6856 constructors can create a compressed writers with a null-wrapped {{CompressionCodecOption}}</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6978">HADOOP-6978</a>.
+     Blocker new feature reported by tlipcon and fixed by tlipcon (io, native, security)<br>
+     <b>Add JNI support for secure IO operations</b><br>
+     <blockquote>In support of MAPREDUCE-2096, we need to add some JNI functionality. In particular, we need the ability to use fstat() on an open file stream, and to use open() with O_EXCL, O_NOFOLLOW, and without O_CREAT.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6977">HADOOP-6977</a>.
+     Major improvement reported by cos and fixed by cos (test)<br>
+     <b>Herriot daemon clients should vend statistics</b><br>
+     <blockquote>The HDFS web user interface serves useful information through dfshealth.jsp and dfsnodelist.jsp.
+<br>
+<br>The Herriot interface to Hadoop cluster daemons would benefit from the addition of some way to channel metics information.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6975">HADOOP-6975</a>.
+     Major bug reported by pkling and fixed by pkling <br>
+     <b>integer overflow in S3InputStream for blocks &gt; 2GB</b><br>
+     <blockquote>S3InputStream has the same integer overflow issue as DFSInputStream (fixed in HDFS-96).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6970">HADOOP-6970</a>.
+     Major bug reported by shv and fixed by boryas (build)<br>
+     <b>SecurityAuth.audit should be generated under /build</b><br>
+     <blockquote>SecurityAuth.audit is generated under currently root project directory whenever I run anything, and is not being cleaned up by the clean target. It should be created under build directory instead.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6965">HADOOP-6965</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>Method in UGI to get Kerberos ticket. </b><br>
+     <blockquote>The getTGT method in AutoRenewal thread is moved to the outer UGI class. It is still a private method but can be used by reloginFromKeyTab to check for TGT expiry. This jira covers common changes for HDFS-1364</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6951">HADOOP-6951</a>.
+     Major bug reported by atm and fixed by atm (security)<br>
+     <b>Distinct minicluster services (e.g. NN and JT) overwrite each other&apos;s service policies</b><br>
+     <blockquote>Because the protocol -&gt; ACL mapping in ServiceAuthorizationManager is static, services which are run in the same JVM have the potential to clobber the other&apos;s service authorization ACLs whenever ServiceAuthorizationManager.refresh() is called. This causes authorization failures if one tries to launch a 2NN connected to a minicluster with hadoop.security.authorization enabled. Seems like each service should have its own instance of a ServiceAuthorizationManager, instead of using static methods.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6950">HADOOP-6950</a>.
+     Trivial improvement reported by philip and fixed by philip (scripts)<br>
+     <b>Suggest that HADOOP_CLASSPATH should be preserved in hadoop-env.sh.template</b><br>
+     <blockquote>HADOOP_CLASSPATH tends to be used to add to bin/hadoop&apos;s classpath.  Because of the way the comment is written, administrator&apos;s who customize hadoop-env.sh often inadvertently disable user&apos;s abilities to use it, by not including the present value of the variable.
+<br>
+<br>I propose we change the commented out suggestion code to include the present value.
+<br>
+<br> # Extra Java CLASSPATH elements.  Optional.
+<br>-# export HADOOP_CLASSPATH=
+<br>+# export HADOOP_CLASSPATH=&quot;&lt;extra_entries&gt;:$HADOOP_CLASSPATH&quot;
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6949">HADOOP-6949</a>.
+     Major improvement reported by navis and fixed by mattf (io)<br>
+     <b>Reduces RPC packet size for primitive arrays, especially long[], which is used at block reporting</b><br>
+     <blockquote>Current implementation of oah.io.ObjectWritable marshals primitive array types as general object array ; array type string + array length + (element type string + value)*n
+<br>
+<br>It would not be needed to specify each element types for primitive arrays.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6947">HADOOP-6947</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (security)<br>
+     <b>Kerberos relogin should set refreshKrb5Config to true</b><br>
+     <blockquote>In working on securing a daemon that uses two different principals from different threads, I found that I wasn&apos;t able to login from a second keytab after I&apos;d logged in from the first. This is because we don&apos;t set the refreshKrb5Config in the Configuration for the Krb5LoginModule - hence it won&apos;t switch over to the correct keytab file if it&apos;s different than the first.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6943">HADOOP-6943</a>.
+     Major improvement reported by atm and fixed by atm (security)<br>
+     <b>The GroupMappingServiceProvider interface should be public</b><br>
+     <blockquote>The GroupMappingServiceProvider interface is presently package-protected. It seems likely that many organizations will be implementing their own versions of this to suit their particular setup. It would be nice if this interface were made public, and annotated with &quot;@InterfaceAudience.Private&quot; and &quot;@InterfaceStability.Evolving&quot;.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6940">HADOOP-6940</a>.
+     Minor bug reported by tomwhite and fixed by tomwhite (fs)<br>
+     <b>RawLocalFileSystem&apos;s markSupported method misnamed markSupport</b><br>
+     <blockquote>It should be named markSupported to override the method defined in InputStream. Since it doesn&apos;t change the default no harm is done.</blockquote></li>
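+
+<p>A minimal sketch of the pattern behind this fix; the wrapper class below is hypothetical and not the actual RawLocalFileSystem code. Declaring the method with the exact name from InputStream and marking it @Override turns a misspelling into a compile-time error.</p>
+<pre>
+import java.io.FilterInputStream;
+import java.io.InputStream;
+
+// Illustrative only: a wrapper stream that overrides markSupported correctly.
+// The @Override annotation turns a misspelled name (e.g. markSupport) into a
+// compile-time error instead of silently adding an unrelated method.
+class TrackingInputStream extends FilterInputStream {
+  TrackingInputStream(InputStream in) {
+    super(in);
+  }
+
+  @Override
+  public boolean markSupported() {
+    return false; // this stream does not support mark/reset
+  }
+}
+</pre>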
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6938">HADOOP-6938</a>.
+     Major bug reported by kzhang and fixed by kzhang (ipc, security)<br>
+     <b>ConnectionId.getRemotePrincipal() should check if security is enabled</b><br>
+     <blockquote>When security is not enabled, getRemotePrincipal() should return null, which means the Kerberos principal of the remote server is ignored. This bug was caught by TestCLI on Yahoo 20S branch.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6933">HADOOP-6933</a>.
+     Minor bug reported by tlipcon and fixed by tlipcon (test)<br>
+     <b>TestListFiles is flaky</b><br>
+     <blockquote>TestListFiles assumes a particular order of the files returned by the directory iterator. There&apos;s no such guarantee made by the underlying API, so the test fails on some hosts.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6932">HADOOP-6932</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>Namenode start (init) fails because of invalid kerberos key, even when security set to &quot;simple&quot;</b><br>
+     <blockquote>NameNode.initialize() calls the login() method even when security is set to simple</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6930">HADOOP-6930</a>.
+     Major bug reported by sharadag and fixed by sharadag (ipc)<br>
+     <b>AvroRpcEngine doesn&apos;t work with generated Avro code</b><br>
+     <blockquote>AvroRpcEngine uses &apos;reflect&apos; based java implementation. There should be a way to have it work with &apos;specific&apos; (generated code from avro idl).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6926">HADOOP-6926</a>.
+     Minor bug reported by tlipcon and fixed by tlipcon (io)<br>
+     <b>SocketInputStream incorrectly implements read()</b><br>
+     <blockquote>SocketInputStream&apos;s read() implementation doesn&apos;t upcast to int correctly, so it can&apos;t read bytes &gt; 0x80. This is the same bug as HADOOP-6925, but in a different spot.</blockquote></li>
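+
+<p>A minimal sketch of the sign-extension issue described above, assuming a stream built on a bulk read; the class below is illustrative and not the actual SocketInputStream code.</p>
+<pre>
+import java.io.IOException;
+import java.io.InputStream;
+
+// Illustrative single-byte read() built on top of read(byte[], int, int).
+// Returning the byte directly would sign-extend values of 0x80 and above to
+// negative ints, which callers would confuse with the -1 end-of-stream marker.
+abstract class SingleByteReadExample extends InputStream {
+  private final byte[] oneByte = new byte[1];
+
+  // Subclasses provide the real bulk read.
+  @Override
+  public abstract int read(byte[] b, int off, int len) throws IOException;
+
+  @Override
+  public int read() throws IOException {
+    int n = read(oneByte, 0, 1);
+    if (n == -1) {
+      return -1;                  // end of stream
+    }
+    return oneByte[0] &amp; 0xff; // mask to 0..255 instead of a signed byte
+  }
+}
+</pre>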
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6922">HADOOP-6922</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (documentation, security)<br>
+     <b>COMMON part of MAPREDUCE-1664</b><br>
+     <blockquote>MAPREDUCE-1664 changes the behavior of queue acls and job acls. This needs documentation changes to cluster_setup.xml and a small change in AccessControlList.java</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6913">HADOOP-6913</a>.
+     Major bug reported by kzhang and fixed by kzhang (security)<br>
+     <b>Circular initialization between UserGroupInformation and KerberosName</b><br>
+     <blockquote>If the first call to UGI is UGI.setConfiguration(conf), it will try to initialize UGI class. During this initialization, the code calls KerberosName.setConfiguration(). KerberosName&apos;s static initializer will in turn call UGI.isSecurityEnabled(). Since UGI hasn&apos;t been completely initialized yet, isSecurityEnabled() will re-initialize UGI with a DEFAULT conf. As a result, the original conf used in UGI.setConfiguration(conf) will be overwritten by the DEFAULT conf.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6911">HADOOP-6911</a>.
+     Minor improvement reported by boryas and fixed by  <br>
+     <b>doc update for DelegationTokenFetcher (part of HDFS-1036)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6907">HADOOP-6907</a>.
+     Major bug reported by kzhang and fixed by kzhang (ipc, security)<br>
+     <b>Rpc client doesn&apos;t use the per-connection conf to figure out server&apos;s Kerberos principal</b><br>
+     <blockquote>Currently, RPC client caches the conf that was passed in to its constructor and uses that same conf (or values obtained from it) for every connection it sets up. This is not sufficient for security since each connection needs to figure out server&apos;s Kerberos principal on a per-connection basis. It&apos;s not reasonable to expect the first conf used by a user to contain all the Kerberos principals that her future connections will ever need. Or worse, if her first conf contains an incorrect principal name, it will prevent the user from connecting to the server even if she later on passes in a correct conf on retry (by calling RPC.getProxy()).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6906">HADOOP-6906</a>.
+     Major bug reported by vinodkv and fixed by vinodkv (fs)<br>
+     <b>FileContext copy() utility doesn&apos;t work with recursive copying of directories.</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6905">HADOOP-6905</a>.
+     Major improvement reported by kzhang and fixed by kzhang (security)<br>
+     <b>Better logging messages when a delegation token is invalid</b><br>
+     <blockquote>From our production logs, we see some logging messages of &quot;token is expired or doesn&apos;t exist&quot;. It would be helpful to know whose token it was.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6903">HADOOP-6903</a>.
+     Major improvement reported by sanjay.radia and fixed by sanjay.radia <br>
+     <b>Make AbstractFileSystem&apos;s methods public to allow filter-Fs-like implementations in a different package than fs</b><br>
+     <blockquote>Make AbstractFileSystem&apos;s methods public to allow filter-Fs-like implementations in a different package than fs</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6900">HADOOP-6900</a>.
+     Major bug reported by sureshms and fixed by hairong <br>
+     <b>FileSystem#listLocatedStatus should not throw generic RuntimeException to indicate error conditions</b><br>
+     <blockquote>HADOOP-6870 introduced FileSystem#listLocatedStatus(), which returns an Iterator to iterate through LocatedFileStatus for files under a directory or recursively under a sub-directory. The Iterator currently throws a generic RuntimeException to indicate error conditions. The API needs to be changed to throw appropriate exceptions instead.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6899">HADOOP-6899</a>.
+     Major bug reported by sanjay.radia and fixed by sanjay.radia (fs)<br>
+     <b>RawLocalFileSystem#setWorkingDir() does not work for relative names</b><br>
+     <blockquote>RawLocalFileSystem#setWorkingDir() does not work for relative names</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6898">HADOOP-6898</a>.
+     Blocker bug reported by tlipcon and fixed by atm (fs, security)<br>
+     <b>FileSystem.copyToLocal creates files with 777 permissions</b><br>
+     <blockquote>FileSystem.copyToLocal ends up calling through to FileUtil.copy, which calls create() on the target file system without passing any permission object. Therefore, the file ends up getting created locally with 777 permissions, which is dangerous -- even if the caller then fixes up permissions afterwards, it exposes a window in which an attacker can open the file.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6892">HADOOP-6892</a>.
+     Major new feature reported by jghoman and fixed by jghoman (security)<br>
+     <b>Common component of HDFS-1150 (Verify datanodes&apos; identities to clients in secure clusters)</b><br>
+     <blockquote>HDFS-1150 will have changes to the start-up scripts and HttpServer.  These are handled here.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6890">HADOOP-6890</a>.
+     Major improvement reported by hairong and fixed by hairong (fs)<br>
+     <b>Improve listFiles API introduced by HADOOP-6870</b><br>
+     <blockquote>This jira is mainly for addressing Suresh&apos;s review comments for HADOOP-6870:
+<br>
+<br>   1. General comment: I have concerns about recursive listing. This could be abused by the applications, creating a lot of requests into HDFS.
+<br>   2. Any deletion of files/directories while recursing through directories results in a RuntimeException and the application has a partial result. Should we ignore it if a directory was in the stack and was not found later when iterating through it?
+<br>   3. FileSystem.java
+<br>          * listFile() - method javadoc could be better organized - first write about if path is directory and two cases recursive=true and false. Then if path is file and two cases recursive=true or false.
+<br>          * listFile() - document throwing RuntimeException, UnsupportedOperationException and the possible cause. IOException is no longer thrown.
+<br>   4. TestListFiles.java
+<br>          * testDirectory() - comments test empty directory and test directory with 1 file should be moved up to relevant sections of the test.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6889">HADOOP-6889</a>.
+     Major new feature reported by hairong and fixed by johnvijoe (ipc)<br>
+     <b>Make RPC to have an option to timeout</b><br>
+     <blockquote>Currently Hadoop RPC does not timeout when the RPC server is alive. What it currently does is that a RPC client sends a ping to the server whenever a socket timeout happens. If the server is still alive, it continues to wait instead of throwing a SocketTimeoutException. This is to avoid a client to retry when a server is busy and thus making the server even busier. This works great if the RPC server is NameNode.
+<br>
+<br>But Hadoop RPC is also used for some of client to DataNode communications, for example, for getting a replica&apos;s length. When a client comes across a problematic DataNode, it gets stuck and can not switch to a different DataNode. In this case, it would be better that the client receives a timeout exception.
+<br>
+<br>I plan to add a new configuration ipc.client.max.pings that specifies the max number of pings that a client could try. If a response can not be received after the specified max number of pings, a SocketTimeoutException is thrown. If this configuration property is not set, a client maintains the current semantics, waiting forever.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6888">HADOOP-6888</a>.
+     Major bug reported by kzhang and fixed by kzhang (fs, security)<br>
+     <b>Being able to close all cached FileSystem objects for a given UGI</b><br>
+     <blockquote>This is the Common part of MAPREDUCE-1900. It adds a utility method to FileSystem that closes all cached filesystems for a given UGI.</blockquote></li>
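+
+<p>A hedged usage sketch of the utility described above; the cleanup method and its surrounding class are hypothetical, and only FileSystem.closeAllForUGI itself comes from this change.</p>
+<pre>
+import java.io.IOException;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.security.UserGroupInformation;
+
+// Illustrative cleanup after work done on behalf of a proxied user:
+// close every FileSystem instance cached for that user's UGI so the
+// cache does not grow without bound in a long-running daemon.
+class UgiCleanupExample {
+  static void cleanup(UserGroupInformation ugi) throws IOException {
+    FileSystem.closeAllForUGI(ugi);
+  }
+}
+</pre>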
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6885">HADOOP-6885</a>.
+     Major bug reported by eli and fixed by eli (security)<br>
+     <b>Fix java doc warnings in Groups and RefreshUserMappingsProtocol</b><br>
+     <blockquote>There are a couple java docs warnings in Groups and RefreshUserMappingsProtocol.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6884">HADOOP-6884</a>.
+     Major improvement reported by zasran and fixed by zasran <br>
+     <b>Add LOG.isDebugEnabled() guard for each LOG.debug(&quot;...&quot;)</b><br>
+     <blockquote>Each LOG.debug(&quot;...&quot;) should be executed only if LOG.isDebugEnabled() is true; in some cases it&apos;s expensive to construct the string that is being printed to the log. It&apos;s much easier to always use LOG.isDebugEnabled() because it&apos;s easier to check (rather than reasoning in each case about whether it&apos;s necessary or not).</blockquote></li>
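+
+<p>A minimal sketch of the guard pattern this change applies; the logger, class, and message below are hypothetical.</p>
+<pre>
+import org.apache.commons.logging.Log;
+import org.apache.commons.logging.LogFactory;
+
+// Illustrative guarded debug logging: the (potentially expensive) message
+// string is only concatenated when debug logging is actually enabled.
+class GuardedLoggingExample {
+  private static final Log LOG = LogFactory.getLog(GuardedLoggingExample.class);
+
+  static void report(String blockId, long length) {
+    if (LOG.isDebugEnabled()) {
+      LOG.debug("Processed block " + blockId + " of length " + length);
+    }
+  }
+}
+</pre>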
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6879">HADOOP-6879</a>.
+     Major improvement reported by iyappans and fixed by cos (build, test)<br>
+     <b>Provide SSH based (Jsch) remote execution API for system tests</b><br>
+     <blockquote>The com.jcraft » jsch library, version 0.1.42 (see http://mvnrepository.com/), needs to be included in the build. This is needed to facilitate implementation of some system (Herriot) testcases.
+<br>
+<br>Please include this in ivy.
+<br>
+<br>jsch is originally located in http://www.jcraft.com/jsch/</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6877">HADOOP-6877</a>.
+     Major improvement reported by kzhang and fixed by kzhang (ipc)<br>
+     <b>Common part of HDFS-1178</b><br>
+     <blockquote>This is the Common part of HDFS-1178.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6873">HADOOP-6873</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>using delegation token over hftp for long running clients (part of hdfs 1296)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6870">HADOOP-6870</a>.
+     Major new feature reported by hairong and fixed by hairong (fs)<br>
+     <b>Add FileSystem#listLocatedStatus to list a directory&apos;s content together with each file&apos;s block locations</b><br>
+     <blockquote>This jira implements the new FileSystem API as proposed in HDFS-202. The new API aims to eliminate individual &quot;getFileBlockLocations&quot; calls to NN for each file in the input directory of a job. Instead, a file&apos;s block locations are returned together with FileStatus when listing a directory, thus improving getSplits performance.</blockquote></li>
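+
+<p>A sketch of how a client might consume the new listing call, assuming the iterator-returning listLocatedStatus(Path) described above; the surrounding class and directory handling are illustrative.</p>
+<pre>
+import java.io.IOException;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.LocatedFileStatus;
+import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.fs.RemoteIterator;
+
+// Illustrative use of listLocatedStatus: each entry already carries its
+// block locations, so no per-file getFileBlockLocations round trip is needed.
+class ListLocatedStatusExample {
+  static void printLocations(Configuration conf, Path dir) throws IOException {
+    FileSystem fs = dir.getFileSystem(conf);
+    RemoteIterator&lt;LocatedFileStatus&gt; it = fs.listLocatedStatus(dir);
+    while (it.hasNext()) {
+      LocatedFileStatus status = it.next();
+      System.out.println(status.getPath() + " blocks=" + status.getBlockLocations().length);
+    }
+  }
+}
+</pre>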
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6862">HADOOP-6862</a>.
+     Major improvement reported by amareshwari and fixed by amareshwari (security)<br>
+     <b>Add api to add user/group to AccessControlList</b><br>
+     <blockquote>Add api addUser(String user) and addGroup(String group) to add user/group to AccessControlList</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6861">HADOOP-6861</a>.
+     Major improvement reported by jnp and fixed by jnp <br>
+     <b>Method in Credentials to read and write a token storage file.</b><br>
+     <blockquote>The jira covers the changes in common corresponding to MAPREDUCE-1566. 
+<br>
+<br>This jira adds new non-static methods in Credentials to read and write a token storage file. A method to copy tokens from another credential object is also added. The static method readTokensAndLoadInUGI is removed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6859">HADOOP-6859</a>.
+     Major improvement reported by sureshms and fixed by sureshms <br>
+     <b>Introduce additional statistics to FileSystem</b><br>
+     <blockquote>Currently FileSystem#statistics tracks bytesRead and bytesWritten. Additional statistics that gives summary of operations performed will be useful for tracking file system use.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6856">HADOOP-6856</a>.
+     Major improvement reported by owen.omalley and fixed by owen.omalley (io)<br>
+     <b>SequenceFile and MapFile need cleanup to remove redundant constructors</b><br>
+     <blockquote>Currently there are 2 public SequenceFile.Reader constructors, 3 public SequenceFile.Writer constructors, 9 public SequenceFile.createWriter methods, 2 public MapFile.Reader constructors, and 8 public MapFile.Writer constructors, all with various historical combinations of parameters that don&apos;t cover the entire space.
+<br>
+<br>All of this makes it *very* difficult to add new optional parameters to SequenceFile and MapFile. 
+<br>
+<br>I&apos;d like to change to the style of FileContext.create with option parameters. I&apos;ll implement one public SequenceFile.Reader constructor and one public SequenceFile.createWriter and implement all of the current variants based on those two. I&apos;ll do the same for MapFile.Reader and MapFile.Writer, including passing parameters down to the underlying SequenceFile.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6853">HADOOP-6853</a>.
+     Major bug reported by jghoman and fixed by jghoman <br>
+     <b>Common component of HDFS-1045</b><br>
+     <blockquote>HDFS-1045 modified UGI, which is in Common on trunk.  This JIRA is for that change.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6846">HADOOP-6846</a>.
+     Major task reported by tomwhite and fixed by tomwhite (build)<br>
+     <b>Scripts for building Hadoop 0.22.0 release</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6845">HADOOP-6845</a>.
+     Major improvement reported by jnp and fixed by jnp <br>
+     <b>TokenStorage renamed to Credentials.</b><br>
+     <blockquote>This jira tracks common changes for MAPREDUCE-1528.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6835">HADOOP-6835</a>.
+     Major improvement reported by tomwhite and fixed by roelofs (io)<br>
+     <b>Support concatenated gzip files</b><br>
+     <blockquote>When running MapReduce with concatenated gzip files as input only the first part is read, which is confusing, to say the least. Concatenated gzip is described in http://www.gnu.org/software/gzip/manual/gzip.html#Advanced-usage and in http://www.ietf.org/rfc/rfc1952.txt. (See original report at http://www.nabble.com/Problem-with-Hadoop-and-concatenated-gzip-files-to21383097.html)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6834">HADOOP-6834</a>.
+     Major bug reported by ahadr and fixed by hong.tang (io)<br>
+     <b>TFile.append compares initial key against null lastKey  </b><br>
+     <blockquote>The following code in TFile.KeyRegister.close: 
+<br>
+<br>            byte[] lastKey = lastKeyBufferOS.getBuffer();
+<br>            int lastLen = lastKeyBufferOS.size();
+<br>            if (tfileMeta.getComparator().compare(key, 0, len, lastKey, 0,
+<br>                lastLen) &lt; 0) {
+<br>              throw new IOException(&quot;Keys are not added in sorted order&quot;);
+<br>            }
+<br>
+<br>compares the initial  key (passed in via  TFile.Writer.append) against a technically NULL lastKey. lastKey is not initialized until after the first call to TFile.Writer.append. The underlying RawComparator interface used for comparisons does not stipulate the proper behavior when either length 1  or length 2 is zero. In the case of LongWritable, its WritableComparator implementation does an unsafe read on the passed in byte arrays b1 and b2. Since TFile pre-allocates the buffer used for storing lastKey, this passes a valid buffer with zero count to LongWritable&apos;s comparator, which ignores length and thus produces incorrect results. 
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6832">HADOOP-6832</a>.
+     Major new feature reported by owen.omalley and fixed by owen.omalley (security)<br>
+     <b>Provide a web server plugin that uses a static user for the web UI</b><br>
+     <blockquote>We need a simple plugin that uses a static user for clusters with security that don&apos;t want to authenticate users on the web UI.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6825">HADOOP-6825</a>.
+     Major improvement reported by rschmidt and fixed by rschmidt <br>
+     <b>FileStatus needs unit tests</b><br>
+     <blockquote>We need some unit tests for FileStatus to prevent problems like those we recently had on HADOOP-6796 and MAPREDUCE-1858.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6818">HADOOP-6818</a>.
+     Major improvement reported by devaraj and fixed by devaraj (security)<br>
+     <b>Provide a JNI-based implementation of GroupMappingServiceProvider</b><br>
+     <blockquote>The default implementation of GroupMappingServiceProvider does a fork of a unix command to get the groups of a user. Since the group resolution happens in the servers, this might be costly. This jira aims at providing a JNI-based implementation for GroupMappingServiceProvider.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6815">HADOOP-6815</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>refreshSuperUserGroupsConfiguration should use server side configuration for the refresh</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6814">HADOOP-6814</a>.
+     Major improvement reported by jnp and fixed by jnp <br>
+     <b>Method in UGI to get the authentication method of the real user.</b><br>
+     <blockquote>UGI should have a method to return the authentication method of the real user for a proxy-user scenario.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6812">HADOOP-6812</a>.
+     Major bug reported by appodictic and fixed by chris.douglas (documentation)<br>
+     <b>fs.inmemory.size.mb not listed in conf. Cluster setup page gives wrong advice.</b><br>
+     <blockquote>http://hadoop.apache.org/common/docs/current/cluster_setup.html
+<br>fs.inmemory.size.mb does not appear in any xml file
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6811">HADOOP-6811</a>.
+     Blocker improvement reported by tomwhite and fixed by tomwhite <br>
+     <b>Remove EC2 bash scripts</b><br>
+     <blockquote>The bash scripts are deprecated in 0.21 (HADOOP-6403) in favour of scripts in Whirr (http://incubator.apache.org/projects/whirr.html). They should be removed in 0.22. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6805">HADOOP-6805</a>.
+     Major improvement reported by boryas and fixed by boryas <br>
+     <b>add buildDTServiceName method to SecurityUtil (as part of MAPREDUCE-1718)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6803">HADOOP-6803</a>.
+     Major test reported by eli and fixed by eli (io)<br>
+     <b>Add native gzip read/write coverage to TestCodec </b><br>
+     <blockquote>Looking at ZlibCompressor I noticed that the finished member is never modified, and is therefore always false. This means ZlibCompressor#finished will always return false so CompressorStream#close loops indefinitely in finish:
+<br>
+<br>      while (!compressor.finished()) {
+<br>        compress();
+<br>      }
+<br>
+<br>I modified TestCodec#testGzipCodecWrite to also cover writing using the native lib and confirmed the hang with jstack. The fix is simple: ZlibCompressor should record when it&apos;s been finished.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6791">HADOOP-6791</a>.
+     Major improvement reported by boryas and fixed by boryas <br>
+     <b>Refresh for proxy superuser config  (common part for HDFS-1096)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6787">HADOOP-6787</a>.
+     Major bug reported by vicaya and fixed by vicaya (fs)<br>
+     <b>Factor out glob pattern code from FileContext and Filesystem</b><br>
+     <blockquote>Refactor the glob pattern code out of FileContext and FileSystem into a package private GlobFilter and the reusable GlobPattern class (InterfaceAudience.Private)
+<br>
+<br>Also fix the handling of ^ outside character class ([...]) reported in HADOOP-6618 and make the glob pattern code less restrictive (not throwing on some valid glob patterns.) and more POSIX standard compliant (support [!...]).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6781">HADOOP-6781</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>security audit log shouldn&apos;t have exception in it.</b><br>
+     <blockquote>security audit log in Server.java also prints the exception information. It shouldn&apos;t be there.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6778">HADOOP-6778</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>add isRunning() method to AbstractDelegationTokenSecretManager (for  HDFS-1044)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6763">HADOOP-6763</a>.
+     Major bug reported by owen.omalley and fixed by boryas <br>
+     <b>Remove verbose logging from the Groups class</b><br>
+     <blockquote>
+2010-02-25 08:30:52,269 INFO  security.Groups (Groups.java:&lt;init&gt;(60)) - Group mapping impl=org.apache.hadoop.security.ShellBasedUnixGroupsMapping; cacheTimeout=300000
+<br>...
+<br>2010-02-25 08:30:57,872 INFO  security.Groups (Groups.java:getGroups(76)) - Returning cached groups for &apos;oom&apos;
+<br>
+<br>should both be demoted to debug level.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6761">HADOOP-6761</a>.
+     Major improvement reported by dms and fixed by dms <br>
+     <b>Improve Trash Emptier</b><br>
+     <blockquote>There are two inefficiencies in the Trash functionality right now that have caused some problems for us.
+<br>First if you configured your trash interval to be one day (24 hours) that means that you store 2 days worth of data eventually. The Current and the previous timestamp that will not be deleted until the end of the interval.
+<br>And another problem is accumulating a lot of data in Trash before the Emptier wakes up. If there are a couple of million files trashed and the Emptier does deletion on HDFS the NameNode will freeze until everything is removed. (this particular problem hopefully will be addressed with HDFS-1143).
+<br>
+<br>My proposal is to have two configuration intervals. One for deleting the trashed data and another for checkpointing. This way for example for intervals of one day and one hour we will only store 25 hours of data instead of 48 right now and the deletions will be happening in smaller chunks every hour of the day instead of a huge deletion at the end of the day now.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6758">HADOOP-6758</a>.
+     Major bug reported by azaroth and fixed by azaroth <br>
+     <b>MapFile.fix does not allow index interval definition</b><br>
+     <blockquote>When using the static method MapFile.fix() there is no way to override the default IndexInterval, which is 128.
+<br>
+<br>The IndexInterval should be taken from the configuration that is passed to the method.
+<br>int indexInterval = 128; 
+<br>indexInterval = conf.getInt(INDEX_INTERVAL, indexInterval); 
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6756">HADOOP-6756</a>.
+     Major bug reported by zasran and fixed by zasran (fs)<br>
+     <b>Clean up and add documentation for configuration keys in CommonConfigurationKeys.java</b><br>
+     <blockquote>Configuration keys in CommonConfigurationKeys.java should be cleaned up and documented (javadoc comments, appropriate *-default.xml descriptions).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6747">HADOOP-6747</a>.
+     Major bug reported by vicaya and fixed by tlipcon <br>
+     <b>TestNetUtils fails on Mac OS X</b><br>
+     <blockquote>TestNetUtils fails consistently after HADOOP-6722 on Mac OS X Leopard 10.5.8:
+<br>
+<br>------------- Standard Error -----------------
+<br>local address: /127.0.0.1
+<br>local port: 64991
+<br>------------- ---------------- ---------------
+<br>
+<br>Testcase: testAvoidLoopbackTcpSockets took 0.421 sec
+<br>        Caused an ERROR
+<br>Invalid argument
+<br>java.net.SocketException: Invalid argument
+<br>        at sun.nio.ch.Net.connect(Native Method)
+<br>        at sun.nio.ch.SocketChannelImpl.connect(SocketChannelImpl.java:507)
+<br>        at org.apache.hadoop.net.SocketIOWithTimeout.connect(SocketIOWithTimeout.java:192)
+<br>        at org.apache.hadoop.net.NetUtils.connect(NetUtils.java:369)
+<br>        at org.apache.hadoop.net.TestNetUtils.testAvoidLoopbackTcpSockets(TestNetUtils.java:46)
+<br>
+<br>Although TCP spec seems to allow it, at least one implementation disallows this corner case. 
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6745">HADOOP-6745</a>.
+     Minor improvement reported by boryas and fixed by boryas (ipc)<br>
+     <b>adding some java doc to Server.RpcMetrics, UGI</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6730">HADOOP-6730</a>.
+     Major bug reported by eli and fixed by raviphulari (fs, test)<br>
+     <b>Bug in FileContext#copy and provide base class for FileContext tests</b><br>
+     <blockquote>Thanks to Eli, who noticed that there is no test for the FileContext#copy operation. 
+<br>On further investigation with the help of Sanjay we found that there is a bug in FileContext#checkDest:
+<br> *FileStatus dstFs = getFileStatus(dst);* should be in a try...catch block.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6715">HADOOP-6715</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (security, util)<br>
+     <b>AccessControlList.toString() returns empty string when we set acl to &quot;*&quot;</b><br>
+     <blockquote>AccessControlList.toString() returns an empty string when we set the acl to &quot;*&quot; and also when we set it to empty (i.e. &quot; &quot;). This is causing wrong values for ACLs shown on the jobdetails.jsp and jobdetailshistory.jsp web pages when acls are set to &quot;*&quot;.
+<br>
+<br>I think AccessControlList.toString() needs to be changed to return &quot;*&quot; when we set the acl to &quot;*&quot;.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6714">HADOOP-6714</a>.
+     Major improvement reported by patrickangeles and fixed by patrickangeles <br>
+     <b>FsShell &apos;hadoop fs -text&apos; does not support compression codecs</b><br>
+     <blockquote>Currently, &apos;hadoop fs -text myfile&apos; looks at the first few magic bytes of a file to determine whether it is gzip compressed or a sequence file. This means &apos;fs -text&apos; cannot properly decode .deflate or .bz2 files (or other codecs specified via configuration).
+<br>
+<br>It should be fairly straightforward to add support for other codecs by checking the file extension against the CompressionCodecFactory to retrieve an appropriate Codec.</blockquote></li>
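+
+<p>A sketch of the extension-based codec lookup suggested above, assuming CompressionCodecFactory.getCodec(Path) selects a codec by file suffix; the helper class and path handling are illustrative, not the actual FsShell change. If no codec matches, the raw stream is returned, which preserves the current behavior for plain files.</p>
+<pre>
+import java.io.IOException;
+import java.io.InputStream;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.io.compress.CompressionCodec;
+import org.apache.hadoop.io.compress.CompressionCodecFactory;
+
+// Illustrative decode-by-extension: ask the codec factory whether the file
+// suffix (.gz, .deflate, .bz2, ...) maps to a configured codec and, if so,
+// wrap the raw stream in the codec's decompressing stream.
+class TextByExtensionExample {
+  static InputStream open(Configuration conf, Path file) throws IOException {
+    FileSystem fs = file.getFileSystem(conf);
+    InputStream raw = fs.open(file);
+    CompressionCodec codec = new CompressionCodecFactory(conf).getCodec(file);
+    return codec == null ? raw : codec.createInputStream(raw);
+  }
+}
+</pre>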
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6706">HADOOP-6706</a>.
+     Major bug reported by devaraj and fixed by devaraj (security)<br>
+     <b>Relogin behavior for RPC clients could be improved</b><br>
+     <blockquote>Currently, the relogin in the RPC client happens on only a SaslException. But we have seen cases where other exceptions are thrown (like IllegalStateException when the client&apos;s ticket is invalid). This jira is to fix that behavior.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6693">HADOOP-6693</a>.
+     Major improvement reported by sureshms and fixed by sureshms <br>
+     <b>Add metrics to track kerberos login activity</b><br>
+     <blockquote>Need metrics to track kerberos login activity such as login rate and the time taken for login.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6683">HADOOP-6683</a>.
+     Minor sub-task reported by xiaokang and fixed by xiaokang (io)<br>
+     <b>the first optimization: ZlibCompressor does not fully utilize the buffer</b><br>
+     <blockquote>Thanks for Hong Tang&apos;s advice.
+<br>
+<br>Sub task created for the first optimization. HADOOP-6662 closed. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6682">HADOOP-6682</a>.
+     Major bug reported by jghoman and fixed by jghoman (io)<br>
+     <b>NetUtils:normalizeHostName does not process hostnames starting with [a-f] correctly</b><br>
+     <blockquote>  public static String normalizeHostName(String name) {
+<br>    if (Character.digit(name.charAt(0), 16) != -1) {
+<br>      return name;
+<br>
+<br>This code is attempting to short-circuit the hostname-&gt;IP resolution on the assumption that if the name starts with a digit, it&apos;s already an IP address. This is of questionable value, but because it checks for a hex digit, it will fail on names starting with [a-f]. Such names will not be converted to an IP address, but will be returned unchanged.</blockquote></li>
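+
+<p>A small illustration of why the hex-digit check misfires; the helper and host names below are made up, mirroring only the check shown in the snippet above.</p>
+<pre>
+// Illustrative check mirroring the snippet above: Character.digit(c, 16)
+// accepts 'a'..'f' as well as '0'..'9', so a host name such as
+// "fileserver.example.com" is wrongly treated as an already-resolved IP.
+class HexDigitCheckExample {
+  static boolean looksNumericToTheOldCheck(String name) {
+    return Character.digit(name.charAt(0), 16) != -1;
+  }
+
+  public static void main(String[] args) {
+    System.out.println(looksNumericToTheOldCheck("10.0.0.1"));               // true (intended)
+    System.out.println(looksNumericToTheOldCheck("fileserver.example.com")); // true (the bug)
+    System.out.println(looksNumericToTheOldCheck("node1.example.com"));      // false
+  }
+}
+</pre>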
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6674">HADOOP-6674</a>.
+     Major improvement reported by jnp and fixed by jnp <br>
+     <b>Performance Improvement in Secure RPC</b><br>
+     <blockquote>This jira introduces two performance improvements in Sasl RPC
+<br>1. Setting of Sasl &apos;quality of protection&apos; to authentication only.
+<br>2. Addition of BufferedOutputStream underneath SaslOutputStream.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6670">HADOOP-6670</a>.
+     Major bug reported by owen.omalley and fixed by owen.omalley (security)<br>
+     <b>UserGroupInformation doesn&apos;t support use in hash tables</b><br>
+     <blockquote>The UserGroupInformation objects are mutable, but they are used as keys in hash tables. This leads to serious problems in the FileSystem cache and RPC connection cache. We need to change the hashCode to be the identity hash code of the Subject and change equals to use == between the Subjects.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6669">HADOOP-6669</a>.
+     Minor bug reported by knoguchi and fixed by knoguchi (io)<br>
+     <b>zlib.compress.level  ignored for DefaultCodec initialization </b><br>
+     <blockquote>HADOOP-5879 added a compression level for codecs, but DefaultCodec seems to ignore this conf value when initialized.
+<br>This happens only when the codec is first created; reinit() probably sets it right.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6663">HADOOP-6663</a>.
+     Major bug reported by xiaokang and fixed by xiaokang (io)<br>
+     <b>BlockDecompressorStream get EOF exception when decompressing the file compressed from empty file</b><br>
+     <blockquote>An empty file can be compressed using BlockCompressorStream, which is for block-based compression algorithms such as LZO. However, when decompressing the compressed file, BlockDecompressorStream gets an EOF exception.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6656">HADOOP-6656</a>.
+     Major bug reported by owen.omalley and fixed by devaraj <br>
+     <b>Security framework needs to renew Kerberos tickets while the process is running</b><br>
+     <blockquote>While a client process is running, there should be a thread that periodically renews the Kerberos credentials to ensure they don&apos;t expire.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6652">HADOOP-6652</a>.
+     Major bug reported by devaraj and fixed by devaraj <br>
+     <b>ShellBasedUnixGroupsMapping shouldn&apos;t have a cache</b><br>
+     <blockquote>Since the Groups class already has a time based cache, the cache from ShellBasedUnixGroupsMapping should be removed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6648">HADOOP-6648</a>.
+     Major bug reported by owen.omalley and fixed by devaraj (security)<br>
+     <b>Credentials should ignore null tokens</b><br>
+     <blockquote>When hftp goes to a non-secure cluster, getDelegationToken returns null. Credentials.addToken needs to ignore null tokens to avoid a NPE in serialization.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6642">HADOOP-6642</a>.
+     Major bug reported by acmurthy and fixed by pocheung <br>
+     <b>Fix javac, javadoc, findbugs warnings</b><br>
+     <blockquote>Unfortunately we&apos;ve missed some javac, javadoc, findbugs warnings in the recent security work.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6632">HADOOP-6632</a>.
+     Major improvement reported by kzhang and fixed by kzhang <br>
+     <b>Support for using different Kerberos keys for different instances of Hadoop services</b><br>
+     <blockquote>We tested using the same Kerberos key for all datanodes in an HDFS cluster or the same Kerberos key for all TaskTrackers in a MapRed cluster, but it doesn&apos;t work. The reason is that when datanodes try to authenticate to the namenode all at once, the Kerberos authenticators they send to the namenode may have the same timestamp and will be rejected as replay requests. This JIRA makes it possible to use a unique key for each service instance.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6623">HADOOP-6623</a>.
+     Minor improvement reported by tlipcon and fixed by tlipcon (util)<br>
+     <b>Add StringUtils.split for non-escaped single-character separator</b><br>
+     <blockquote>This is for HDFS-1028 but useful generally. String.split(&quot;/&quot;) for example is way slower than an implementation that is specific to only single-character separators.</blockquote></li>
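+
+<p>A sketch of a separator-specific split, assuming the goal is simply to avoid regex compilation for a one-character separator; this is illustrative and not the StringUtils.split implementation added by this change.</p>
+<pre>
+import java.util.ArrayList;
+import java.util.List;
+
+// Illustrative single-character split: no regex compilation, just indexOf.
+class SimpleSplitExample {
+  static String[] split(String s, char separator) {
+    List&lt;String&gt; parts = new ArrayList&lt;String&gt;();
+    int start = 0;
+    int idx;
+    while ((idx = s.indexOf(separator, start)) != -1) {
+      parts.add(s.substring(start, idx));
+      start = idx + 1;
+    }
+    parts.add(s.substring(start)); // trailing segment (may be empty)
+    return parts.toArray(new String[parts.size()]);
+  }
+}
+</pre>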
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6620">HADOOP-6620</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>NPE if renewer is passed as null in getDelegationToken</b><br>
+     <blockquote>If renewer is passed as null in getDelegationToken, an NPE is thrown. We should handle null renewer and the token must not be allowed to be renewed if the renewer is null or empty string.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6613">HADOOP-6613</a>.
+     Major bug reported by kzhang and fixed by kzhang (ipc, security)<br>
+     <b>RPC server should check for version mismatch first</b><br>
+     <blockquote>Currently AuthMethod is checked before Version.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6612">HADOOP-6612</a>.
+     Major bug reported by boryas and fixed by boryas (security)<br>
+     <b>Protocols RefreshUserToGroupMappingsProtocol and RefreshAuthorizationPolicyProtocol will fail with security enabled</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6605">HADOOP-6605</a>.
+     Minor improvement reported by metcalfc and fixed by eli <br>
+     <b>Add JAVA_HOME detection to hadoop-config</b><br>
+     <blockquote>The commands that source hadoop-config.sh currently bail with an error if JAVA_HOME is not set. Let&apos;s detect JAVA_HOME (from a list of locations on various OS types) if JAVA_HOME is not already set by hadoop-env.sh or the environment. This way users don&apos;t have to manually configure it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6600">HADOOP-6600</a>.
+     Major new feature reported by boryas and fixed by boryas <br>
+     <b>mechanism for authorization check for inter-server protocols</b><br>
+     <blockquote>Allow configuration of authorization based on protocol (inter-server).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6599">HADOOP-6599</a>.
+     Major improvement reported by sureshms and fixed by sureshms <br>
+     <b>Split RPC metrics into summary and detailed metrics</b><br>
+     <blockquote>Currently RPC metrics tracks items that provide a summary of RPC usage along with more detailed per-method statistics that track the number of method calls made and the time spent on each call. Combining summary and detailed statistics results in a large metrics report which metrics collection systems may not handle. The proposal is to split the metrics into summary and detailed metrics.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6586">HADOOP-6586</a>.
+     Major new feature reported by boryas and fixed by boryas (security)<br>
+     <b>Log authentication and authorization failures and successes</b><br>
+     <blockquote>This jira will cover logging of RPC authentication and service-level (SL) authorization.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6584">HADOOP-6584</a>.
+     Major improvement reported by jghoman and fixed by jghoman <br>
+     <b>Provide Kerberized SSL encryption for webservices</b><br>
+     <blockquote>Some web services should be authenticated via SSL backed by Kerberos, both to provide cross-cluster secure communication and to provide intra-cluster server authentication for services such as the {Name,SecondaryName,Backup,Checkpoint}node&apos;s image transfer and balancer.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6578">HADOOP-6578</a>.
+     Minor improvement reported by tlipcon and fixed by pirroh (conf)<br>
+     <b>Configuration should trim whitespace around a lot of value types</b><br>
+     <blockquote>I&apos;ve seen multiple users make an error where they&apos;ve listed some whitespace around a class name (eg for configuring a scheduler). This results in a ClassNotFoundException which is very hard to debug, as you don&apos;t notice the whitespace in the exception! We should simply trim the whitespace in Configuration.getClass and Configuration.getClasses to avoid this class of user error.
+<br>
+<br>Similarly, we should trim in getInt, getLong, etc - anywhere that whitespace doesn&apos;t have semantic meaning we should be a little less strict on input.</blockquote></li>
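+
+<p>A small sketch of the failure mode and the trim being asked for; the property name and helper class below are hypothetical.</p>
+<pre>
+import org.apache.hadoop.conf.Configuration;
+
+// Illustrative: a class name configured with stray whitespace. Without
+// trimming, loading " com.example.MyScheduler" fails with
+// ClassNotFoundException; trimming the raw value first avoids it.
+class TrimConfigExample {
+  static String schedulerClassName(Configuration conf) {
+    String raw = conf.get("example.scheduler.class", "");
+    return raw.trim(); // strip surrounding whitespace before loading the class
+  }
+}
+</pre>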
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6562">HADOOP-6562</a>.
+     Minor improvement reported by eli and fixed by eli (test)<br>
+     <b>FileContextSymlinkBaseTest should use FileContextTestHelper</b><br>
+     <blockquote>FileContextSymlinkBaseTest should use FileContextTestHelper, both for utility methods and defining the root test directory instead of using /tmp. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6536">HADOOP-6536</a>.
+     Major bug reported by amareshwari and fixed by ravidotg (fs)<br>
+     <b>FileUtil.fullyDelete(dir) behavior is not defined when we pass a symlink as the argument</b><br>
+     <blockquote>FileUtil.fullyDelete(dir) deletes the contents of the sym-linked directory when we pass a symlink. If this is the intended behavior, it should be documented as such. 
+<br>Or it should be changed not to delete the contents of the sym-linked directory.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6496">HADOOP-6496</a>.
+     Minor bug reported by lars_francke and fixed by tlipcon <br>
+     <b>HttpServer sends wrong content-type for CSS files (and others)</b><br>
+     <blockquote>CSS files are sent as text/html, causing problems if the HTML page is rendered in standards mode. The HDFS interface, for example, still works because it is rendered in quirks mode; the HBase interface doesn&apos;t work because it is rendered in standards mode. See HBASE-2110 for more details.
+<br>
+<br>I&apos;ve had a quick look at HttpServer but I&apos;m too unfamiliar with it to see the problem. I think this started happening with HADOOP-6441 which would lead me to believe that the filter is called for every request and not only *.jsp and *.html. I&apos;d consider this a bug but I don&apos;t know enough about this to provide a fix.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6482">HADOOP-6482</a>.
+     Minor bug reported by cwilkes and fixed by eli (util)<br>
+     <b>GenericOptionsParser constructor that takes Options and String[] ignores options</b><br>
+     <blockquote>This constructor:
+<br>
+<br>  public GenericOptionsParser(Options opts, String[] args) {
+<br>    this(new Configuration(), new Options(), args);
+<br>  }
+<br>
+<br>should do a this(new Configuration(), opts, args)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6472">HADOOP-6472</a>.
+     Major new feature reported by boryas and fixed by boryas <br>
+     <b>add tokenCache option to GenericOptionsParser for passing file with secret keys to a map reduce job</b><br>
+     <blockquote>For MAPRED-1338 we need an option to pass a file with secret keys (tokens) to a mapreduce job.
+<br>The name of the file is set in the config and will be picked up by JobSubmitter.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6436">HADOOP-6436</a>.
+     Major improvement reported by eli and fixed by rvs <br>
+     <b>Remove auto-generated native build files </b><br>
+     <blockquote>The repo currently includes the automake and autoconf generated files for the native build. Per discussion on HADOOP-6421 let&apos;s remove them and use the host&apos;s automake and autoconf. We should also do this for libhdfs and fuse-dfs. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6298">HADOOP-6298</a>.
+     Major improvement reported by marz and fixed by owen.omalley <br>
+     <b>BytesWritable#getBytes is a bad name that leads to programming mistakes</b><br>
+     <blockquote>Pretty much everyone at Rapleaf who has worked with Hadoop has misused BytesWritable#getBytes at some point, not expecting the byte array to be padded. I think we can completely alleviate these programming mistakes by deprecating and renaming this method (again) to be more descriptive. I propose &quot;getPaddedBytes()&quot; or &quot;getPaddedValue()&quot;. It would also be helpful to have a helper method &quot;getNonPaddedValue()&quot; that makes a copy into a non-padded byte array. </blockquote></li>
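+
+<p>A sketch of the safe pattern for callers, assuming only that getBytes() returns the padded backing array and getLength() bounds the valid prefix; the helper class is illustrative.</p>
+<pre>
+import java.util.Arrays;
+import org.apache.hadoop.io.BytesWritable;
+
+// Illustrative: extract only the valid bytes from a BytesWritable.
+// getBytes() returns the padded backing array, which is usually longer
+// than the logical value; getLength() bounds the valid prefix.
+class BytesWritableCopyExample {
+  static byte[] exactBytes(BytesWritable value) {
+    return Arrays.copyOf(value.getBytes(), value.getLength());
+  }
+}
+</pre>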
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6056">HADOOP-6056</a>.
+     Major improvement reported by stevel@apache.org and fixed by pirroh (scripts)<br>
+     <b>Use java.net.preferIPv4Stack to force IPv4</b><br>
+     <blockquote>This was mentioned on HADOOP-3427, there is a property,  java.net.preferIPv4Stack, which you set to true for the java net process to switch to IPv4 everywhere. 
+<br>
+<br>As Hadoop doesn&apos;t work on IPv6, this should be set to true in the startup scripts. Hopefully this will ensure that Jetty will also pick it up.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-4675">HADOOP-4675</a>.
+     Major improvement reported by bockelman and fixed by bockelman (metrics)<br>
+     <b>Current Ganglia metrics implementation is incompatible with Ganglia 3.1</b><br>
+     <blockquote>Ganglia changed its wire protocol in the 3.1.x series; the current implementation only works for 3.0.x.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-4487">HADOOP-4487</a>.
+     Major new feature reported by kzhang and fixed by kzhang (security)<br>
+     <b>Security features for Hadoop</b><br>
+     <blockquote>This is a top-level tracking JIRA for security work we are doing in Hadoop. Please add reference to this when opening new security related JIRAs.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2287">HDFS-2287</a>.
+     Trivial bug reported by tlipcon and fixed by tlipcon (test)<br>
+     <b>TestParallelRead has a small off-by-one bug</b><br>
+     <blockquote>Noticed this bug when I was running TestParallelRead - a simple off-by-one error in some internal bounds checking.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2573">HDFS-2573</a>.
+     Major bug reported by shv and fixed by cos (data-node, test)<br>
+     <b>TestFiDataXceiverServer is failing, not testing OOME</b><br>
+     <blockquote>TestFiDataXceiverServer is failing occasionally. It turns out also that the test is not testing the desired condition, because OOME is not caught in DataXceiverServer.run()</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2514">HDFS-2514</a>.
+     Major bug reported by eli and fixed by eli (name-node)<br>
+     <b>Link resolution bug for intermediate symlinks with relative targets</b><br>
+     <blockquote>There&apos;s a bug in the way the Namenode resolves intermediate symlinks (ie the symlink is not the final path component) in paths when the symlink&apos;s target is a relative path. Will post the full description in the first comment.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2513">HDFS-2513</a>.
+     Major task reported by cos and fixed by cos (build)<br>
+     <b>Bump jetty to 6.1.26</b><br>
+     <blockquote>HDFS part of Hadoop-7450</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2491">HDFS-2491</a>.
+     Major bug reported by umamaheswararao and fixed by umamaheswararao <br>
+     <b>TestBalancer can fail when datanode utilization and avgUtilization is exactly same.</b><br>
+     <blockquote>Stack Trace:
+<br>junit.framework.AssertionFailedError: 127.0.0.1:60986is not an underUtilized node: utilization=22.0 avgUtilization=22.0 threshold=10.0
+<br>at org.apache.hadoop.hdfs.server.balancer.Balancer.initNodes(Balancer.java:1014)
+<br>at org.apache.hadoop.hdfs.server.balancer.Balancer.initNodes(Balancer.java:953)
+<br>at org.apache.hadoop.hdfs.server.balancer.Balancer.run(Balancer.java:1502)
+<br>at org.apache.hadoop.hdfs.server.balancer.TestBalancer.runBalancer(TestBalancer.java:247)
+<br>at org.apache.hadoop.hdfs.server.balancer.TestBalancer.test(TestBalancer.java:234)
+<br>at org.apache.hadoop.hdfs.server.balancer.TestBalancer.twoNodeTest(TestBalancer.java:312)
+<br>at org.apache.hadoop.hdfs.server.balancer.TestBalancer.__CLR2_4_39j3j5b10ou(TestBalancer.java:328)
+<br>at org.apache.hadoop.hdfs.server.balancer.TestBalancer.testBalancer0(TestBalancer.java:324)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2452">HDFS-2452</a>.
+     Major bug reported by shv and fixed by umamaheswararao (data-node)<br>
+     <b>OutOfMemoryError in DataXceiverServer takes down the DataNode</b><br>
+     <blockquote>OutOfMemoryError brings down DataNode, when DataXceiverServer tries to spawn a new data transfer thread.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2388">HDFS-2388</a>.
+     Major bug reported by shv and fixed by shv (build)<br>
+     <b>Remove dependency on different version of slf4j in avro</b><br>
+     <blockquote>This is the HDFS part of HADOOP-7697.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2383">HDFS-2383</a>.
+     Blocker bug reported by shv and fixed by shv (test)<br>
+     <b>TestDfsOverAvroRpc is failing on 0.22</b><br>
+     <blockquote>TestDfsOverAvroRpc.testWorkingDirectory() is failing, possibly as a result of the Avro upgrade.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2346">HDFS-2346</a>.
+     Blocker bug reported by umamaheswararao and fixed by lakshman (test)<br>
+     <b>TestHost2NodesMap &amp; TestReplicasMap will fail depending upon execution order of test methods</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2343">HDFS-2343</a>.
+     Blocker bug reported by jrottinghuis and fixed by jrottinghuis (hdfs client)<br>
+     <b>Make hdfs use same version of avro as HBase</b><br>
+     <blockquote>HBase depends on avro 1.5.3 whereas hadoop-common depends on 1.3.2.
+<br>When building HBase on top of hadoop, this should be consistent.
+<br>Moreover, this should be consistent between common, hdfs, and mapreduce.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2341">HDFS-2341</a>.
+     Blocker bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Contribs not building</b><br>
+     <blockquote>Contribs are not getting built.
+<br>Snippet from Jenkins:
+<br>
+<br>compile:
+<br>   [subant] No sub-builds to iterate on</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2315">HDFS-2315</a>.
+     Blocker bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Build fails with ant 1.7.0 but works with 1.8.0</b><br>
+     <blockquote>Build failure:
+<br>https://builds.apache.org/view/G-L/view/Hadoop/job/Hadoop-Hdfs-22-branch/80
+<br>build.xml calls build.xml in contrib, which calls fuse build, which in turn uses build-contrib.
+<br>The inheritAll=true overrides the basedir in ant 1.7.0 but not in 1.8.0.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2297">HDFS-2297</a>.
+     Blocker bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>FindBugs OutOfMemoryError</b><br>
+     <blockquote>When running the findbugs target from Jenkins, I get an OutOfMemory error.
+<br>The &quot;effort&quot; in FindBugs is set to Max which ends up using a lot of memory to go through all the classes. The jvmargs passed to FindBugs is hardcoded to 512 MB max.
+<br>
+<br>We can leave the default to 512M, as long as we pass this as an ant parameter which can be overwritten in individual cases through -D, or in the build.properties file (either basedir, or user&apos;s home directory).
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2290">HDFS-2290</a>.
+     Major bug reported by shv and fixed by benoyantony (name-node)<br>
+     <b>Block with corrupt replica is not getting replicated</b><br>
+     <blockquote>A block has one replica marked as corrupt and two good ones. countNodes() correctly detects that there are only 2 live replicas, and fsck reports the block as under-replicated. But ReplicationMonitor never schedules replication of good replicas.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2286">HDFS-2286</a>.
+     Trivial improvement reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>DataXceiverServer logs AsynchronousCloseException at shutdown</b><br>
+     <blockquote>During DN shutdown, the acceptor thread gets an AsynchronousCloseException and logs it at WARN level. This exception is expected, since another thread is closing the listener socket, so we should just swallow it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2285">HDFS-2285</a>.
+     Major bug reported by shv and fixed by shv (name-node)<br>
+     <b>BackupNode should reject requests trying to modify namespace</b><br>
+     <blockquote>I am trying to remove a file from BackupNode using
+<br>hadoop fs -fs hdfs://backup.node.com:50100 -rm /README.txt
+<br>which is supposed to fail, but it seems to be hanging forever.
+<br>Needs some investigation. It used to throw SafeModeException if I remember correctly.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2281">HDFS-2281</a>.
+     Major bug reported by shv and fixed by umamaheswararao (name-node)<br>
+     <b>NPE in checkpoint during processIOError()</b><br>
+     <blockquote>At the end of checkpoint BackupNode tries to convergeJournalSpool() and calls revertFileStreams(). The latter closes each file stream, and tries to rename the corresponding file to its permanent location current/edits. If for any reason the rename fails processIOError() is called for failed streams. processIOError() will try to close the stream again and will get NPE in EditLogFileOutputStream.close() because bufCurrent was set to null by the previous close.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2280">HDFS-2280</a>.
+     Major bug reported by shv and fixed by shv (name-node)<br>
+     <b>BackupNode fails with MD5 checksum Exception during checkpoint if BN&apos;s image is outdated.</b><br>
+     <blockquote>If BN starts after NN made changes to the namespace, it fails with an MD5 checksum exception during checkpoint when it reads the new image uploaded from NN. This is happening because imageDigest is not reset to null, but keeps the value of the originally loaded BN image.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2271">HDFS-2271</a>.
+     Major bug reported by umamaheswararao and fixed by umamaheswararao (name-node)<br>
+     <b>startJournalSpool should invoke ProcessIOError with failed storage directories if createEditLogFile throws any exception.  </b><br>
+     <blockquote>Even if createEditLogFile fails in startJournalSpool of BackupStorage, BackupNode will proceed with exceptions. 
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2258">HDFS-2258</a>.
+     Major bug reported by shv and fixed by shv (name-node, test)<br>
+     <b>TestLeaseRecovery2 fails as lease hard limit is not reset to default</b><br>
+     <blockquote>TestLeaseRecovery2.testSoftLeaseRecovery() fails as lease hard limit remains set to 1 sec from the previous test case. If initial file creation in testSoftLeaseRecovery() takes longer than 1 sec, NN correctly reassigns the lease to itself and starts recovery. The test fails as the client cannot hflush() and close the file.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2232">HDFS-2232</a>.
+     Blocker bug reported by shv and fixed by zero45 (test)<br>
+     <b>TestHDFSCLI fails on 0.22 branch</b><br>
+     <blockquote>Several HDFS CLI tests fail on the 0.22 branch. I can see 3 reasons:
+<br># Not generic enough regular expression for host names and paths. Similar to MAPREDUCE-2304.
+<br># Some command outputs have new-line in the end.
+<br># And some seem to produce [much] more output than expected.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2214">HDFS-2214</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Generated POMs hardcode dependency on hadoop-common version 0.22.0-SNAPSHOT</b><br>
+     <blockquote>The generated poms inject the version of hdfs itself, but hardcode the version of hadoop-common they depend on.
+<br>When trying to build downstream projects for example mapreduce, then they will require hadoop-common-0.22.0-SNAPSHOT.jar.
+<br>
+<br>When trying to do an offline build this will fail to resolve as another hadoop-common has been installed in the local maven repo.
+<br>Even during online build, it should compile against the hadoop-common that hdfs compiled against.
+<br>
+<br>When versions mismatch one cannot do a coherent build. That is particularly problematic when making simultaneous change in hadoop-common and hadoop-hdfs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2211">HDFS-2211</a>.
+     Blocker bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Build does not pass along properties to contrib builds</b><br>
+     <blockquote>The subant calls that compile the contribs do not pass along parameters from the parent build.
+<br>Properties such as hadoop-common.version, asfrepo, offline, etc. are not passed along.
+<br>The result is that a build not connected to the Internet fails, and hdfsproxy refuses to build against its own recently built common, instead downloading 0.22-SNAPSHOT from Apache again.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2189">HDFS-2189</a>.
+     Blocker bug reported by zero45 and fixed by jrottinghuis <br>
+     <b>guava-r09 dependency missing from &quot;ivy/hadoop-hdfs-template.xml&quot; in HDFS.</b><br>
+     <blockquote>Corrected version of: https://issues.apache.org/jira/browse/MAPREDUCE-2627</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2071">HDFS-2071</a>.
+     Minor bug reported by kihwal and fixed by kihwal (data-node)<br>
+     <b>Use of isConnected() in DataXceiver is invalid</b><br>
+     <blockquote>The use of Socket.isConnected() in DataXceiver.run() is not valid. It returns false until the connection is made and then always returns true after that. It will never return false after the initial connection is successfully made. Socket.isClosed() or SocketChannel.isOpen() should be used instead, assuming someone is handling SocketException and does Socket.close() or SocketChannel.close(). It seems the op handlers in DataXceiver are diligently using IOUtils.closeStream(), which will invoke SocketChannel.close().
+<br>
+<br>{code}
+<br>- } while (s.isConnected() &amp;&amp; socketKeepaliveTimeout &gt; 0);
+<br>+ } while (!s.isClosed() &amp;&amp; socketKeepaliveTimeout &gt; 0);
+<br>{code}
+<br>
+<br>The effect of this bug is very minor, as the socket is read again right after. If the connection was closed, readOp() will throw an EOFException, which is caught and dealt with properly. The system still functions normally, with probably only a few microseconds of extra overhead in the premature connection closure cases.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2054">HDFS-2054</a>.
+     Minor improvement reported by kihwal and fixed by kihwal (data-node)<br>
+     <b>BlockSender.sendChunk() prints ERROR for connection closures encountered  during transferToFully()</b><br>
+     <blockquote>The addition of ERROR was part of HDFS-1527. In environments where clients tear down FSInputStream/connection before reaching the end of stream, this error message often pops up. Since these are not really errors and especially not the fault of data node, the message should be toned down at least. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2039">HDFS-2039</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon <br>
+     <b>TestNameNodeMetrics uses a bad test root path</b><br>
+     <blockquote>I found that running TestNameNodeMetrics within eclipse fails, since TEST_ROOT_DIR_PATH has a default which is a non-absolute path. Since this path is a DFS path, rather than a local FS path, it shouldn&apos;t use the test root dir system property anyhow - we can just hardcode it to a path on DFS.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2012">HDFS-2012</a>.
+     Blocker bug reported by atm and fixed by umamaheswararao (balancer, test)<br>
+     <b>Recurring failure of TestBalancer due to incorrect treatment of nodes whose utilization equals avgUtilization.</b><br>
+     <blockquote>This has been failing on Hudson for the last two builds and fails on my local box as well.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2002">HDFS-2002</a>.
+     Major bug reported by shv and fixed by zero45 (name-node)<br>
+     <b>Incorrect computation of needed blocks in getTurnOffTip()</b><br>
+     <blockquote>{{SafeModeInfo.getTurnOffTip()}} under-reports the number of blocks needed to reach the safemode threshold.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-2000">HDFS-2000</a>.
+     Major bug reported by atm and fixed by atm <br>
+     <b>Missing deprecation for io.bytes.per.checksum</b><br>
+     <blockquote>Hadoop long ago deprecated the configuration &quot;io.bytes.per.checksum&quot; in favor of &quot;dfs.bytes-per-checksum&quot;, but when the programmatic deprecation support was added, we didn&apos;t add an entry for this pair.
+<br>
+<br>This is causing some tests to fail on branch-0.22 since the inclusion of HADOOP-7287, since some tests which were inadvertently using default config values are now having their settings actually picked up.</blockquote></li>
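+
+<blockquote>A minimal sketch of the kind of mapping this change adds (illustrative only; where the call actually lives in the HDFS code is not shown here):
+<br>{code}
+<br>// Register the old key so values set under it are visible under the new key.
+<br>Configuration.addDeprecation(&quot;io.bytes.per.checksum&quot;,
+<br>    new String[] { &quot;dfs.bytes-per-checksum&quot; });
+<br>
+<br>Configuration conf = new Configuration();
+<br>conf.setInt(&quot;io.bytes.per.checksum&quot;, 512);
+<br>// With the deprecation registered, the old setting is picked up here:
+<br>int bytesPerChecksum = conf.getInt(&quot;dfs.bytes-per-checksum&quot;, 512);
+<br>{code}</blockquote>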
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1997">HDFS-1997</a>.
+     Major sub-task reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>Image transfer process misreports client side exceptions</b><br>
+     <blockquote>If the image transfer process receives a client-side error when transferring edit logs, it will throw an exception before it has completely read all of the input from the server-side servlet. Then, the finally clause will throw a new error, since the received length is less than the length given in the header. This masks the client-side exception and makes it look like a network error or a server-side problem.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1981">HDFS-1981</a>.
+     Blocker bug reported by ram_krish and fixed by umamaheswararao (name-node)<br>
+     <b>When namenode goes down while checkpointing and if is started again subsequent Checkpointing is always failing</b><br>
+     <blockquote>This scenario is applicable in NN and BNN case.
+<br>
+<br>When the namenode goes down after creating the edits.new, on subsequent restart the divertFileStreams will not happen to edits.new as the edits.new file is already present and the size is zero.
+<br>
+<br>so on trying to saveCheckPoint an exception occurs 
+<br>2011-05-23 16:38:57,476 WARN org.mortbay.log: /getimage: java.io.IOException: GetImage failed. java.io.IOException: Namenode has an edit log with timestamp of 2011-05-23 16:38:56 but new checkpoint was created using editlog  with timestamp 2011-05-23 16:37:30. Checkpoint Aborted.
+<br>
+<br>Is this a bug, or is that the intended behaviour?
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1980">HDFS-1980</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (build)<br>
+     <b>Move build/webapps deeper in directory hierarchy to aid eclipse users</b><br>
+     <blockquote>Currently in order to successfully run unit tests in Eclipse, you have to add the &quot;build/&quot; directory to the classpath, or else the tests won&apos;t be able to find the &quot;webapps&quot; dir. This is really annoying because Eclipse then often confuses the classes in build/classes with the source during operations like &quot;go to definition of class&quot;.
+<br>
+<br>If we move it into another directory, eg build/web/webapps then we can add build/web to the eclipse classpath and have tests work by default without also having two copies of every class.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1978">HDFS-1978</a>.
+     Major bug reported by brocknoland and fixed by eli (libhdfs)<br>
+     <b>All but first option in LIBHDFS_OPTS is ignored</b><br>
+     <blockquote>In getJNIEnv, we go through LIBHDFS_OPTS with strtok and count the number of args, then create an array of options based on that information. But when we actually set up the options we only use the first arg.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1969">HDFS-1969</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>Running rollback on new-version namenode destroys namespace</b><br>
+     <blockquote>The following sequence leaves the namespace in an inconsistent/broken state:
+<br>- format NN using 0.20 (or any prior release, probably)
+<br>- run hdfs namenode -upgrade on 0.22. ^C the NN once it comes up.
+<br>- run hdfs namenode -rollback on 0.22  (this should fail but doesn&apos;t!)
+<br>
+<br>This leaves the name directory in a state such that the version file claims it&apos;s an 0.20 namespace, but the fsimage is in 0.22 format. It then crashes when trying to start up.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1965">HDFS-1965</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (security)<br>
+     <b>IPCs done using block token-based tickets can&apos;t reuse connections</b><br>
+     <blockquote>This is the reason that TestFileConcurrentReaders has been failing a lot. Reproducing a comment from HDFS-1057:
+<br>
+<br>The test has a thread which continually re-opens the file which is being written to. Since the file&apos;s in the middle of being written, it makes an RPC to the DataNode in order to determine the visible length of the file. This RPC is authenticated using the block token which came back in the LocatedBlocks object as the security ticket.
+<br>
+<br>When this RPC hits the IPC layer, it looks at its existing connections and sees none that can be re-used, since the block token differs between the two requesters. Hence, it reconnects, and we end up with hundreds or thousands of IPC connections to the datanode.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1964">HDFS-1964</a>.
+     Major bug reported by atm and fixed by atm <br>
+     <b>Incorrect HTML unescaping in DatanodeJspHelper.java</b><br>
+     <blockquote>HDFS-1575 introduced some HTML unescaping of parameters so that viewing a file would work for paths containing HTML-escaped characters, but in two of the places did the unescaping either too early or too late.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1957">HDFS-1957</a>.
+     Minor improvement reported by asrabkin and fixed by asrabkin (documentation)<br>
+     <b>Documentation for HFTP</b><br>
+     <blockquote>There should be some documentation for HFTP.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1954">HDFS-1954</a>.
+     Major improvement reported by philovivero and fixed by phunt (name-node)<br>
+     <b>Improve corrupt files warning message on NameNode web UI</b><br>
+     <blockquote>On NameNode web interface, you may get this warning:
+<br>
+<br>  WARNING : There are about 32 missing blocks. Please check the log or run fsck.
+<br>
+<br>If the cluster was started less than 14 days before, it would be great to add: &quot;Is dfs.data.dir defined?&quot;
+<br>
+<br>If at the point of that error message, that parameter could be checked, and error made &quot;OMG dfs.data.dir isn&apos;t defined!&quot; that&apos;d be even better. As is, troubleshooting undefined parameters is a difficult proposition.
+<br>
+<br>I suspect this is an easy fix.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1952">HDFS-1952</a>.
+     Major bug reported by mattf and fixed by azuriel <br>
+     <b>FSEditLog.open() appears to succeed even if all EDITS directories fail</b><br>
+     <blockquote>FSEditLog.open() appears to &quot;succeed&quot; even if all of the individual directories failed to allow creation of an EditLogOutputStream.  The problem and solution are essentially similar to that of HDFS-1505.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1948">HDFS-1948</a>.
+     Major task reported by stack and fixed by stack <br>
+     <b>Forward port &apos;hdfs-1520 lightweight namenode operation to trigger lease recovery&apos;</b><br>
+     <blockquote>This issue is about forward porting from branch-0.20-append the little namenode api that facilitates stealing of a file&apos;s lease. The forward port would be an adaptation of hdfs-1520 and its companion patches, hdfs-1555 and hdfs-1554, to suit the TRUNK.
+<br>
+<br>The intent is to get this fix into 0.22, time willing; I&apos;ll run a vote to get an OK on adding it to the branch. HBase needs this facility.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1947">HDFS-1947</a>.
+     Trivial improvement reported by eli and fixed by eli (hdfs client)<br>
+     <b>DFSClient should use mapreduce.task.attempt.id</b><br>
+     <blockquote>DFSClient should use {{mapreduce.task.attempt.id}} instead of the deprecated {{mapred.task.id}}.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1946">HDFS-1946</a>.
+     Major task reported by eli and fixed by eli <br>
+     <b>HDFS part of HADOOP-7291</b><br>
+     <blockquote>The hudson-test-patch target needs to be updated to not pass python.home since this argument is no longer needed.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1943">HDFS-1943</a>.
+     Blocker bug reported by weiyj and fixed by mattf (scripts)<br>
+     <b>fail to start datanode while start-dfs.sh is executed by root user</b><br>
+     <blockquote>When start-dfs.sh is run by root user, we got the following error message:
+<br># start-dfs.sh
+<br>Starting namenodes on [localhost ]
+<br>localhost: namenode running as process 2556. Stop it first.
+<br>localhost: starting datanode, logging to /usr/hadoop/hadoop-common-0.23.0-SNAPSHOT/bin/../logs/hadoop-root-datanode-cspf01.out
+<br>localhost: Unrecognized option: -jvm
+<br>localhost: Could not create the Java virtual machine.
+<br>
+<br>The -jvm option should be passed to jsvc when we are starting a secure
+<br>datanode, but it is still passed to java when start-dfs.sh is run by root
+<br>while the secure datanode is disabled. This is a bug in bin/hdfs.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1936">HDFS-1936</a>.
+     Blocker bug reported by sureshms and fixed by sureshms (name-node)<br>
+     <b>Updating the layout version from HDFS-1822 causes upgrade problems.</b><br>
+     <blockquote>In HDFS-1822 and HDFS-1842, the layout versions for 203, 204, 22 and trunk were changed. Some of the namenode logic that depends on layout version is broken because of this. Read the comment for more description.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1935">HDFS-1935</a>.
+     Minor improvement reported by tlipcon and fixed by jrottinghuis (build)<br>
+     <b>Build should not redownload ivy on every invocation</b><br>
+     <blockquote>Currently we re-download ivy every time we build. If the jar already exists, we should skip this.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1932">HDFS-1932</a>.
+     Critical bug reported by tlipcon and fixed by jolly <br>
+     <b>Ensure that HDFS configuration deprecations are set up in every spot that HDFS configurations are loaded.</b><br>
+     <blockquote>Currently we have code blocks like the following in lots of places:
+<br>
+<br>  static{
+<br>    Configuration.addDefaultResource(&quot;hdfs-default.xml&quot;);
+<br>    Configuration.addDefaultResource(&quot;hdfs-site.xml&quot;);
+<br>  }
+<br>
+<br>This is dangerous since, if we don&apos;t remember to also classload HdfsConfiguration, the config key deprecations won&apos;t work. We should add a method like HdfsConfiguration.init() which would load the default resources as well as ensure that deprecation gets initialized properly.</blockquote></li>
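+
+<blockquote>A sketch of the proposed helper (assumed shape, not the committed code):
+<br>{code}
+<br>public class HdfsConfiguration extends Configuration {
+<br>  static {
+<br>    addDeprecatedKeys();                        // register HDFS key deprecations once
+<br>    Configuration.addDefaultResource(&quot;hdfs-default.xml&quot;);
+<br>    Configuration.addDefaultResource(&quot;hdfs-site.xml&quot;);
+<br>  }
+<br>
+<br>  /** Calling this forces the static block above to run. */
+<br>  public static void init() {}
+<br>
+<br>  private static void addDeprecatedKeys() { /* Configuration.addDeprecation(...) calls */ }
+<br>}
+<br>{code}
+<br>Any code path that loads HDFS configuration can then simply call HdfsConfiguration.init() (or construct a new HdfsConfiguration()) instead of adding the default resources itself.</blockquote>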
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1925">HDFS-1925</a>.
+     Major bug reported by shv and fixed by fwiffo <br>
+     <b>SafeModeInfo should use DFS_NAMENODE_SAFEMODE_THRESHOLD_PCT_DEFAULT instead of 0.95</b><br>
+     <blockquote>{{SafeMode()}} constructor has 0.95f default threshold hard-coded. This should be replaced by the constant {{DFS_NAMENODE_SAFEMODE_THRESHOLD_PCT_DEFAULT}}, which is correctly set to 0.999f.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1921">HDFS-1921</a>.
+     Blocker bug reported by atm and fixed by mattf <br>
+     <b>Save namespace can cause NN to be unable to come up on restart</b><br>
+     <blockquote>I discovered this in the course of trying to implement a fix for HDFS-1505.
+<br>
+<br>Per the comment for {{FSImage.saveNamespace(...)}}, the algorithm for save namespace proceeds in the following order:
+<br>
+<br># rename current to lastcheckpoint.tmp for all of them,
+<br># save image and recreate edits for all of them,
+<br># rename lastcheckpoint.tmp to previous.checkpoint.
+<br>
+<br>The problem is that step 3 occurs regardless of whether or not an error occurs for all storage directories in step 2. Upon restart, the NN will see non-existent or corrupt {{current}} directories, and no {{lastcheckpoint.tmp}} directories, and so will conclude that the storage directories are not formatted.
+<br>
+<br>This issue appears to be present on both 0.22 and 0.23. This should arguably be a 0.22/0.23 blocker.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1909">HDFS-1909</a>.
+     Major bug reported by tomwhite and fixed by tomwhite <br>
+     <b>TestHDFSCLI fails due to typo in expected output </b><br>
+     <blockquote>&quot;apended&quot; is misspelled in testHDFSConf.xml and causes the test to fail on the 0.22 branch.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1897">HDFS-1897</a>.
+     Minor bug reported by asrabkin and fixed by whangsf (documentation)<br>
+     <b>Documentation refers to removed option dfs.network.script</b><br>
+     <blockquote>The HDFS user guide tells users to use dfs.network.script for rack awareness. In fact, this option has been removed and using it will trigger a fatal error on DataNode startup. Documentation should describe the current rack awareness configuration system.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1891">HDFS-1891</a>.
+     Major bug reported by sureshms and fixed by sureshms (test)<br>
+     <b>TestBackupNode fails intermittently</b><br>
+     <blockquote>TestBackupNode fails due to unexpected ipv6 address format.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1866">HDFS-1866</a>.
+     Minor improvement reported by eli and fixed by qwertymaniac (data-node, documentation)<br>
+     <b>Document dfs.datanode.max.transfer.threads in hdfs-default.xml</b><br>
+     <blockquote>dfs.datanode.max.transfer.threads (formerly dfs.datanode.max.xcievers) should be covered in hdfs-default.xml.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1861">HDFS-1861</a>.
+     Major improvement reported by eli and fixed by eli (data-node)<br>
+     <b>Rename dfs.datanode.max.xcievers and bump its default value</b><br>
+     <blockquote>Reasonably sized jobs and HBase easily exhaust the current default for dfs.datanode.max.xcievers. 4096 works better in practice.
+<br>
+<br>Let&apos;s also deprecate it in favor of a more intuitive name, eg dfs.datanode.max.receiver.threads.</blockquote></li>
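+
+<blockquote>For illustration (the key name dfs.datanode.max.transfer.threads follows HDFS-1866 above; the old name is assumed to keep working through config deprecation):
+<br>{code}
+<br>// Raise the DataNode transfer-thread limit, e.g. for an HBase-heavy cluster.
+<br>Configuration conf = new Configuration();
+<br>conf.setInt(&quot;dfs.datanode.max.transfer.threads&quot;, 4096);
+<br>{code}</blockquote>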
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1855">HDFS-1855</a>.
+     Major test reported by mattf and fixed by mattf (test)<br>
+     <b>TestDatanodeBlockScanner.testBlockCorruptionRecoveryPolicy() part 2 fails in two different ways</b><br>
+     <blockquote>The second part of test case TestDatanodeBlockScanner.testBlockCorruptionRecoveryPolicy(), &quot;corrupt replica recovery for two corrupt replicas&quot;, always fails, half the time with a checksum error upon block replication, and half the time by timing out upon failure to delete the second corrupt replica.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1850">HDFS-1850</a>.
+     Major bug reported by eli and fixed by eli (data-node, name-node)<br>
+     <b>DN should transmit absolute failed volume count rather than increments to the NN</b><br>
+     <blockquote>The API added in HDFS-811 for the DN to report volume failures to the NN is &quot;inc(DN)&quot;. However the given sequence of events will result in the NN forgetting about reported failed volumes:
+<br>
+<br># DN loses a volume and reports it
+<br># NN restarts
+<br># DN re-registers to the new NN
+<br>
+<br>A more robust interface would be to have the DN report the total number of volume failures to the NN on each heartbeat (the same way other volume state is transmitted).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1845">HDFS-1845</a>.
+     Major bug reported by johnvijoe and fixed by johnvijoe <br>
+     <b>symlink comes up as directory after namenode restart</b><br>
+     <blockquote>When a symlink is first created, it gets added to the edit log. When the namenode is restarted, it reads from this edit log, represents the symlink correctly, and saves this information to its image. If the namenode is restarted again, it reads from this FSImage, but thinks that the symlink is a directory. This is because it uses &quot;Block[] blocks&quot; to determine whether an INode is a directory, a file, or a symlink. Since both a directory and a symlink have blocks as null, it thinks that a symlink is a directory.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1825">HDFS-1825</a>.
+     Major task reported by nidaley and fixed by nidaley <br>
+     <b>Remove thriftfs contrib</b><br>
+     <blockquote>As per vote on general@ (http://mail-archives.apache.org/mod_mbox/hadoop-general/201102.mbox/%3CEF44CFE2-692F-4956-8B33-D125D05E2B53@mac.com%3E) thriftfs can be removed: 
+<br>svn remove hdfs/trunk/src/contrib/thriftfs
+<br>and wiki updated:
+<br>http://wiki.apache.org/hadoop/Attic</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1823">HDFS-1823</a>.
+     Blocker bug reported by tomwhite and fixed by tomwhite (scripts)<br>
+     <b>start-dfs.sh script fails if HADOOP_HOME is not set</b><br>
+     <blockquote>HDFS portion of HADOOP-6953</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1822">HDFS-1822</a>.
+     Blocker bug reported by sureshms and fixed by sureshms (name-node)<br>
+     <b>Editlog opcodes overlap between 20 security and later releases</b><br>
+     <blockquote>Same opcode are used for different operations between 0.20.security, 0.22 and 0.23. This results in failure to load editlogs on later release, especially during upgrades.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1821">HDFS-1821</a>.
+     Major bug reported by johnvijoe and fixed by johnvijoe <br>
+     <b>FileContext.createSymlink with kerberos enabled sets wrong owner</b><br>
+     <blockquote>TEST SETUP
+<br>Using attached sample hdfs java program that illustrates the issue.
+<br>Using cluster with Kerberos enabled on cluster
+<br>
+<br># Compile instructions
+<br>$ javac Symlink.java -cp `hadoop classpath`
+<br>$ jar -cfe Symlink.jar Symlink Symlink.class
+<br>
+<br># create test file for symlink to use
+<br>1. hadoop fs -touchz /user/username/filetest
+<br>
+<br># Create symlink using file context
+<br>2. hadoop jar Symlink.jar ln /user/username/filetest /user/username/testsymlink
+<br>
+<br># Verify owner of test file
+<br>3. hadoop jar Symlink.jar ls /user/username/
+<br>-rw-r--r-- username hdfs /user/jeagles/filetest
+<br>-rwxrwxrwx username@XX.XXXX.XXXXX.XXX hdfs /user/username/testsymlink
+<br>
+<br>RESULTS
+<br>1. Owner shows &apos;username@XX.XXXX.XXXXX.XXX&apos; for symlink, expecting &apos;username&apos;.
+<br>2. Symlink is corrupted and can&apos;t be removed, since it was created with an invalid user
+<br>
+<br>
+<br>------------------------
+<br>Sample program to create Symlink
+<br>
+<br>FileContext fc = FileContext.getFileContext(getConf());
+<br>fc.createSymlink(target, symlink, false);
+<br>
+<br>---------------------------------------</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1806">HDFS-1806</a>.
+     Major bug reported by mattf and fixed by mattf (data-node, name-node)<br>
+     <b>TestBlockReport.blockReport_08() and _09() are timing-dependent and likely to fail on fast servers</b><br>
+     <blockquote>Method waitForTempReplica() polls every 100ms during block replication, attempting to &quot;catch&quot; a datanode in the state of having a TEMPORARY replica.  But examination of a current Hudson test failure log shows that the replica goes from &quot;start&quot; to &quot;TEMPORARY&quot; to &quot;FINALIZED&quot; in only 50ms, so of course the poll usually misses it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1786">HDFS-1786</a>.
+     Minor bug reported by szetszwo and fixed by umamaheswararao (test)<br>
+     <b>Some cli test cases expect a &quot;null&quot; message</b><br>
+     <blockquote>There are a few test cases specified in {{TestHDFSCLI}} and {{TestDFSShell}} expecting &quot;null&quot; messages.
+<br>e.g. in {{testHDFSConf.xml}},
+<br>          &lt;expected-output&gt;get: null&lt;/expected-output&gt;
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1782">HDFS-1782</a>.
+     Major bug reported by johnvijoe and fixed by johnvijoe (name-node)<br>
+     <b>FSNamesystem.startFileInternal(..) throws NullPointerException</b><br>
+     <blockquote>I&apos;m observing that when one balancer is running, trying to run another one results in a
+<br>&quot;java.lang.NullPointerException&quot; error. I was hoping to see the message &quot;Another balancer is running. 
+<br>Exiting....  Exiting ...&quot;. This is a reproducible issue.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1781">HDFS-1781</a>.
+     Major bug reported by johnvijoe and fixed by johnvijoe (scripts)<br>
+     <b>jsvc executable delivered into wrong package...</b><br>
+     <blockquote>The jsvc executable is delivered in the 0.22 hdfs package, but the script that uses it (bin/hdfs) refers to
+<br>$HADOOP_HOME/bin/jsvc to find it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1762">HDFS-1762</a>.
+     Major test reported by tomwhite and fixed by cos (build, test)<br>
+     <b>Allow TestHDFSCLI to be run against a cluster</b><br>
+     <blockquote>Currently TestHDFSCLI starts mini clusters to run tests against. It would be useful to be able to support running against arbitrary clusters for testing purposes.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1736">HDFS-1736</a>.
+     Minor improvement reported by daryn and fixed by daryn (data-node)<br>
+     <b>Break dependency between DatanodeJspHelper and FsShell</b><br>
+     <blockquote>DatanodeJspHelper has an artificial dependency on a date formatter field in FsShell.  A pending bug is reorganizing the FsShell commands so this field will no longer be available.  The dependency should be broken by having DataNodeJspHelper contain its own independent date formatter.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1625">HDFS-1625</a>.
+     Minor bug reported by tlipcon and fixed by szetszwo (test)<br>
+     <b>TestDataNodeMXBean fails if disk space usage changes during test run</b><br>
+     <blockquote>I&apos;ve seen this on our internal hudson - we get failures like:
+<br>
+<br>null expected:&lt;...:{&quot;freeSpace&quot;:857683[43552],&quot;usedSpace&quot;:28672,&quot;...&gt; but was:&lt;...:{&quot;freeSpace&quot;:857683[59936],&quot;usedSpace&quot;:28672,&quot;...&gt;
+<br>
+<br>because some other build on the same build slave used up some disk space during the middle of the test.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1621">HDFS-1621</a>.
+     Major bug reported by tlipcon and fixed by jolly <br>
+     <b>Fix references to hadoop-common-${version} in build.xml</b><br>
+     <blockquote>Similar to MAPREDUCE-2315, we should fix any references to the hadoop common jar that use ${version} instead of ${hadoop-common.version}.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1619">HDFS-1619</a>.
+     Major improvement reported by rvs and fixed by rvs (libhdfs)<br>
+     <b>Remove AC_TYPE* from the libhdfs</b><br>
+     <blockquote>Remove AC_TYPE* from the libhdfs build since we get these via stdint.
+<br>
+<br>Currently configure.ac uses AC_TYPE_INT16_T, AC_TYPE_INT32_T, AC_TYPE_INT64_T and AC_TYPE_UINT16_T and thus requires autoconf 2.61 or higher. 
+<br>This prevents using it on such platforms as CentOS/RHEL 5.4 and 5.5. Given that those are pretty popular and also given that it is really difficult to find a platform
+<br>these days that doesn&apos;t natively define  intXX_t types I&apos;m curious as to whether we can simply remove those macros or perhaps fail ONLY if we happen to be on such
+<br>a platform. 
+<br>
+<br>Here&apos;s a link to GNU autoconf docs for your reference:
+<br>    http://www.gnu.org/software/hello/manual/autoconf/Particular-Types.html</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1618">HDFS-1618</a>.
+     Major improvement reported by rvs and fixed by rvs (build)<br>
+     <b>configure files that are generated as part of the released tarball need to have executable bit set </b><br>
+     <blockquote>Currently the configure files that are packaged in a tarball are -rw-rw-r--</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1615">HDFS-1615</a>.
+     Major bug reported by tlipcon and fixed by scott_carey <br>
+     <b>seek() on closed DFS input stream throws NPE</b><br>
+     <blockquote>After closing an input stream on DFS, seeking slightly ahead of the last read will throw an NPE:
+<br>
+<br>java.lang.NullPointerException
+<br>        at org.apache.hadoop.hdfs.DFSInputStream.seek(DFSInputStream.java:749)
+<br>        at org.apache.hadoop.fs.FSDataInputStream.seek(FSDataInputStream.java:42)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1602">HDFS-1602</a>.
+     Major bug reported by cos and fixed by boryas (name-node)<br>
+     <b>NameNode storage failed replica restoration is broken</b><br>
+     <blockquote>NameNode storage restore functionality doesn&apos;t work (as HDFS-903 demonstrated). This needs to be either disabled, or removed, or fixed. This feature also fails HDFS-1496</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1597">HDFS-1597</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon <br>
+     <b>Batched edit log syncs can reset synctxid and throw assertions</b><br>
+     <blockquote>The top of FSEditLog.logSync has the following assertion:
+<br>        assert editStreams.size() &gt; 0 : &quot;no editlog streams&quot;;
+<br>which should actually come after checking to see if the sync was already batched in by another thread.
+<br>
+<br>This is related to a second bug in which the same case causes synctxid to be reset to 0</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1591">HDFS-1591</a>.
+     Major bug reported by pocheung and fixed by pocheung <br>
+     <b>Fix javac, javadoc, findbugs warnings</b><br>
+     <blockquote>Split from HADOOP-6642</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1582">HDFS-1582</a>.
+     Major improvement reported by rvs and fixed by rvs (libhdfs)<br>
+     <b>Remove auto-generated native build files</b><br>
+     <blockquote>The repo currently includes the automake and autoconf generated files for the native build. Per discussion on HADOOP-6421 let&apos;s remove them and use the host&apos;s automake and autoconf. We should also do this for libhdfs and fuse-dfs. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1575">HDFS-1575</a>.
+     Blocker bug reported by tlipcon and fixed by atm <br>
+     <b>viewing block from web UI broken</b><br>
+     <blockquote>DatanodeJspHelper seems to expect the file path to be in the &quot;path info&quot; of the HttpRequest, rather than in a parameter. I see the following exception when visiting the URL {{http://localhost.localdomain:50075/browseBlock.jsp?blockId=5006108823351810567&amp;blockSize=20&amp;genstamp=1001&amp;filename=%2Fuser%2Ftodd%2Fissue&amp;datanodePort=50010&amp;namenodeInfoPort=50070}}
+<br>
+<br>java.io.FileNotFoundException: File does not exist: /
+<br>  at org.apache.hadoop.hdfs.server.namenode.FSNamesystem.getBlockLocationsInternal(FSNamesystem.java:834)
+<br>...
+<br>  at org.apache.hadoop.hdfs.server.datanode.DatanodeJspHelper.generateFileDetails(DatanodeJspHelper.java:258)
+<br>  at org.apache.hadoop.hdfs.server.datanode.browseBlock_jsp._jspService(browseBlock_jsp.java:79)
+<br>  at org.apache.jasper.runtime.HttpJspBase.service(HttpJspBase.java:97)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1572">HDFS-1572</a>.
+     Blocker bug reported by liangly and fixed by jghoman <br>
+     <b>Checkpointer should trigger checkpoint with specified period.</b><br>
+     <blockquote>
+     {dfs.namenode.checkpoint.period} in the configuration determines the checkpoint period. However, in the current code, the Checkpointer triggers a checkpoint every 5 minutes (periodMSec=5*60*1000).
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1562">HDFS-1562</a>.
+     Major test reported by eli and fixed by eli (name-node, test)<br>
+     <b>Add rack policy tests</b><br>
+     <blockquote>The existing replication tests (TestBlocksWithNotEnoughRacks, TestPendingReplication, TestOverReplicatedBlocks, TestReplicationPolicy, TestUnderReplicatedBlocks, and TestReplication) are missing tests for rack policy violations.  This jira adds the following tests which I created when generating a new patch for HDFS-15.
+<br>
+<br>* Test that blocks that have a sufficient number of total replicas, but are not replicated cross rack, get replicated cross rack when a rack becomes available.
+<br>* Test that new blocks for an underreplicated file will get replicated cross rack. 
+<br>* Mark a block as corrupt, test that when it is re-replicated that it is still replicated across racks.
+<br>* Reduce the replication factor of a file, making sure that the only block that is across racks is not removed when deleting replicas.
+<br>* Test that when a block is replicated because a replica is lost due to host failure, the rack policy is preserved.
+<br>* Test that when the excess replicas of a block are reduced due to a node re-joining the cluster, the rack policy is not violated.
+<br>* Test that rack policy is still respected when blocks are replicated due to node decommissioning.
+<br>* Test that rack policy is still respected when blocks are replicated due to node decommissioning, even when the blocks are over-replicated.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1561">HDFS-1561</a>.
+     Blocker bug reported by shv and fixed by shv (name-node)<br>
+     <b>BackupNode listens on default host</b><br>
+     <blockquote>Currently BackupNode uses DNS to find its default host name, and then starts RPC server listening on that address ignoring the address specified in the configuration. Therefore, there is no way to start BackupNode on a particular ip or host address. BackupNode should use the address specified in the configuration instead.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1560">HDFS-1560</a>.
+     Minor bug reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>dfs.data.dir permissions should default to 700</b><br>
+     <blockquote>Currently, dfs.data.dir defaults to 755 permissions, which isn&apos;t necessary for any reason, and is a security issue if not changed on a secured cluster. We should default to 700</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1550">HDFS-1550</a>.
+     Blocker bug reported by hairong and fixed by hairong (hdfs client)<br>
+     <b>NPE when listing a file with no location</b><br>
+     <blockquote>The lines listed below will cause a NullPointerException in DFSUtil.locatedBlocks2Locations (line 208) because EMPTY_BLOCK_LOCS will return null when calling blocks.getLocatedBlocks()
+<br>   /** a default LocatedBlocks object, its content should not be changed */
+<br>   private final static LocatedBlocks EMPTY_BLOCK_LOCS = new LocatedBlocks();
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1544">HDFS-1544</a>.
+     Major bug reported by vicaya and fixed by vicaya <br>
+     <b>Ivy resolve force mode should be turned off by default</b><br>
+     <blockquote>cf. HADOOP-7068</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1542">HDFS-1542</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (hdfs client)<br>
+     <b>Deadlock in Configuration.writeXml when serialized form is larger than one DFS block</b><br>
+     <blockquote>Configuration.writeXml holds a lock on itself and then writes the XML to an output stream, during which DFSOutputStream will try to get a lock on ackQueue/dataQueue. Meanwhile the DataStreamer thread will call functions like conf.getInt() and deadlock against the other thread, since it could be the same conf object.
+<br>
+<br>This causes a deterministic deadlock whenever the serialized form is larger than block size.</blockquote></li>
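+
+<blockquote>An illustrative trigger (not taken from the report), assuming the same Configuration object backs both the DFS client and the data being written:
+<br>{code}
+<br>FileSystem fs = FileSystem.get(conf);
+<br>FSDataOutputStream out = fs.create(new Path(&quot;/tmp/job.xml&quot;));
+<br>// writeXml holds the Configuration lock while the DataStreamer thread of the
+<br>// DFS output stream calls back into the same Configuration, so if the
+<br>// serialized XML spans more than one block the two threads deadlock.
+<br>conf.writeXml(out);
+<br>out.close();
+<br>{code}</blockquote>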
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1532">HDFS-1532</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (test)<br>
+     <b>Exclude Findbugs warning in FSImageFormat$Saver</b><br>
+     <blockquote>HDFS-1473 had a followup patch which changed a method name, but I forgot to modify the findbugs exclude file to match.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1531">HDFS-1531</a>.
+     Trivial bug reported by tlipcon and fixed by tlipcon (data-node, name-node)<br>
+     <b>Clean up stack traces due to duplicate MXBean registration</b><br>
+     <blockquote>In the minicluster unit tests, we try to register MXBeans for each DN, but since the JMX context is JVM-wide, we get a InstanceAlreadyExistsException for all but the first. This stack trace clutters test logs a lot.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1529">HDFS-1529</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (hdfs client)<br>
+     <b>Incorrect handling of interrupts in waitForAckedSeqno can cause deadlock</b><br>
+     <blockquote>In HDFS-895 the handling of interrupts during hflush/close was changed to preserve interrupt status. This ends up creating an infinite loop in waitForAckedSeqno if the waiting thread gets interrupted, since Object.wait() has a strange semantic that it doesn&apos;t give up the lock even momentarily if the thread is already in interrupted state at the beginning of the call.
+<br>
+<br>We should decide what the correct behavior is here - if a thread is interrupted while it&apos;s calling hflush() or close() should we (a) throw an exception, perhaps InterruptedIOException (b) ignore, or (c) wait for the flush to finish but preserve interrupt status on exit?</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1527">HDFS-1527</a>.
+     Major bug reported by pkling and fixed by pkling (data-node)<br>
+     <b>SocketOutputStream.transferToFully fails for blocks &gt;= 2GB on 32 bit JVM</b><br>
+     <blockquote>On 32 bit JVM, SocketOutputStream.transferToFully() fails if the block size is &gt;= 2GB. We should fall back to a normal transfer in this case. 
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1524">HDFS-1524</a>.
+     Blocker bug reported by hairong and fixed by hairong (name-node)<br>
+     <b>Image loader should make sure to read every byte in image file</b><br>
+     <blockquote>While working on HDFS-1070, I came across a very strange bug. Occasionally when loading a compressed image, the NameNode throws an exception complaining that the image file is corrupt. However, the result returned by the md5sum utility matches the checksum value stored in the VERSION file.
+<br>
+<br>It turns out the image loader leaves 4 bytes unread after loading all the real data of an image. Those unread bytes may be some compression-related meta-info. The image loader should make sure to read to the end of the file in order to compute a correct checksum.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1523">HDFS-1523</a>.
+     Major bug reported by cos and fixed by cos (test)<br>
+     <b>TestLargeBlock is failing on trunk</b><br>
+     <blockquote>TestLargeBlock has been failing for more than a week now on 0.22 and trunk with
+<br>java.io.IOException: Premeture EOF from inputStream
+<br>  at org.apache.hadoop.io.IOUtils.readFully(IOUtils.java:118)
+<br>  at org.apache.hadoop.hdfs.BlockReader.readChunk(BlockReader.java:275)
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1513">HDFS-1513</a>.
+     Minor improvement reported by eli and fixed by eli <br>
+     <b>Fix a number of warnings</b><br>
+     <blockquote>There are a bunch of warnings besides DeprecatedUTF8, HDFS-1512 and two warnings caused by a Java bug (http://bugs.sun.com/view_bug.do?bug_id=646014) that we can fix.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1511">HDFS-1511</a>.
+     Blocker bug reported by nidaley and fixed by jghoman <br>
+     <b>98 Release Audit warnings on trunk and branch-0.22</b><br>
+     <blockquote>There are 98 release audit warnings on trunk. See attached txt file. These must be fixed or filtered out to get back to a reasonably small number of warnings. The OK_RELEASEAUDIT_WARNINGS property in src/test/test-patch.properties should also be set appropriately in the patch that fixes this issue.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1507">HDFS-1507</a>.
+     Minor bug reported by eli and fixed by eli (test)<br>
+     <b>TestAbandonBlock should abandon a block</b><br>
+     <blockquote>TestAbandonBlock as written just tests that if one client tries to abandon another it will fail because the new client doesn&apos;t have a lease on the other client&apos;s file, which doesn&apos;t cover the block abandonement code path.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1505">HDFS-1505</a>.
+     Blocker bug reported by tlipcon and fixed by atm <br>
+     <b>saveNamespace appears to succeed even if all directories fail to save</b><br>
+     <blockquote>After HDFS-1071, saveNamespace now appears to &quot;succeed&quot; even if all of the individual directories failed to save.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1504">HDFS-1504</a>.
+     Minor bug reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>FSImageSaver should catch all exceptions, not just IOE</b><br>
+     <blockquote>FSImageSaver currently just catches IOE. This means that if some other error like OOME or failed assert happens in saving one of the images, the coordinating thread won&apos;t know there was a problem.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1503">HDFS-1503</a>.
+     Minor bug reported by eli and fixed by tlipcon (test)<br>
+     <b>TestSaveNamespace fails</b><br>
+     <blockquote>Will attach the full log. Here&apos;s the relevant snippet:
+<br>
+<br>Exception in thread &quot;FSImageSaver for /home/eli/src/hdfs4/build/test/data/dfs/na
+<br>me1 of type IMAGE_AND_EDITS&quot; java.lang.RuntimeException: Injected fault: saveFSI
+<br>mage second time
+<br>....
+<br>        at java.lang.Thread.run(Thread.java:619)
+<br>Exception in thread &quot;FSImageSaver for /home/eli/src/hdfs4/build/test/data/dfs/na
+<br>me2 of type IMAGE_AND_EDITS&quot; java.lang.StackOverflowError
+<br>        at java.util.Arrays.copyOf(Arrays.java:2882)
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1502">HDFS-1502</a>.
+     Minor bug reported by eli and fixed by hairong <br>
+     <b>TestBlockRecovery triggers NPE in assert</b><br>
+     <blockquote>
+<br>Testcase: testRBW_RWRReplicas took 10.333 sec
+<br>        Caused an ERROR
+<br>null
+<br>java.lang.NullPointerException
+<br>        at org.apache.hadoop.hdfs.server.datanode.DataNode.syncBlock(DataNode.java:1881)
+<br>        at org.apache.hadoop.hdfs.server.datanode.TestBlockRecovery.testSyncReplicas(TestBlockRecovery.java:144)
+<br>        at org.apache.hadoop.hdfs.server.datanode.TestBlockRecovery.testRBW_RWRReplicas(TestBlockRecovery.java:305)
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1500">HDFS-1500</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (test, tools)<br>
+     <b>TestOfflineImageViewer failing on trunk</b><br>
+     <blockquote>Testcase: testOIV took 22.679 sec
+<br>  FAILED
+<br>Failed reading valid file: No image processor to read version -26 is available.
+<br>junit.framework.AssertionFailedError: Failed reading valid file: No image processor to read version -26 is available.
+<br>  at org.apache.hadoop.hdfs.tools.offlineImageViewer.TestOfflineImageViewer.outputOfLSVisitor(TestOfflineImageViewer.java:171)
+<br>  at org.apache.hadoop.hdfs.tools.offlineImageViewer.TestOfflineImageViewer.testOIV(TestOfflineImageViewer.java:86)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1498">HDFS-1498</a>.
+     Minor bug reported by eli and fixed by eli (name-node)<br>
+     <b>FSDirectory#unprotectedConcat calls setModificationTime on a file</b><br>
+     <blockquote>The HDFSConcat test fails when asserts are enabled because FSDirectory#unprotectedConcat calls INode#setModificationTime on a file, and this method asserts that the argument is a directory. It should use setModificationTimeForce since we know the target is a file; its mod time should be set to now unconditionally since we know we&apos;re modifying it. The behavior should be equivalent.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1491">HDFS-1491</a>.
+     Major improvement reported by sanjay.radia and fixed by sanjay.radia <br>
+     <b>Update  Hdfs to match the change of methods from protected to public  in AbstractFileSystem (Hadoop-6903)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1487">HDFS-1487</a>.
+     Major bug reported by zhong and fixed by zhong (name-node)<br>
+     <b>FSDirectory.removeBlock() should update diskspace count of the block owner node</b><br>
+     <blockquote>This bug leads a quota computation error. When calling abandonBlock(), the cached diskspace count of INodeDirectoryWithQuota is larger than the actual consumed space value.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1485">HDFS-1485</a>.
+     Minor improvement reported by yaojingguo and fixed by yaojingguo <br>
+     <b>Typo in BlockPlacementPolicy.java</b><br>
+     <blockquote>In line 157, &quot;thatis&quot; should be &quot;that is&quot;.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1483">HDFS-1483</a>.
+     Major bug reported by pkling and fixed by pkling (hdfs client)<br>
+     <b>DFSClient.getBlockLocations returns BlockLocations with no indication that the corresponding blocks are corrupt</b><br>
+     <blockquote>When there are no uncorrupted replicas of a block, FSNamesystem.getBlockLocations returns LocatedBlocks corresponding to corrupt blocks. When DFSClient converts these to BlockLocations, the information that the corresponding block is corrupt is lost. We should add a field to BlockLocation to indicate whether the corresponding block is corrupt in order to warn the client that reading this block will fail. This would be especially useful for tools such as RAID FSCK, which could then easily inspect whether data or parity blocks are corrupted without having to make direct RPC calls.</blockquote></li>
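+
+<blockquote>A sketch of how a tool could use the proposed flag (isCorrupt() is the accessor this change is expected to add; the rest is the existing FileSystem API):
+<br>{code}
+<br>FileStatus st = fs.getFileStatus(path);
+<br>for (BlockLocation loc : fs.getFileBlockLocations(st, 0, st.getLen())) {
+<br>  if (loc.isCorrupt()) {
+<br>    System.err.println(&quot;All replicas corrupt for block at offset &quot; + loc.getOffset());
+<br>  }
+<br>}
+<br>{code}</blockquote>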
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1473">HDFS-1473</a>.
+     Major sub-task reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>Refactor storage management into separate classes than fsimage file reading/writing</b><br>
+     <blockquote>Currently the FSImage class is responsible both for storage management (eg moving around files, tracking file names, the VERSION file, etc) as well as for the actual serialization and deserialization of the &quot;fsimage&quot; file within the storage directory.
+<br>
+<br>I&apos;d like to refactor the loading and saving code into new classes. This will make testing easier and also make the major changes in HDFS-1073 easier to understand.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1472">HDFS-1472</a>.
+     Major improvement reported by rvadali and fixed by rvadali (tools)<br>
+     <b>Refactor DFSck to allow programmatic access to output</b><br>
+     <blockquote>DFSck prints the list of corrupt files to stdout. This jira proposes that it write to a PrintStream object that is passed to the constructor. This will allow components like RAID to programmatically get a list of corrupt files.</blockquote></li>
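+
+<blockquote>A sketch of the intended programmatic use (the (Configuration, PrintStream) constructor shape follows the description above and is otherwise an assumption):
+<br>{code}
+<br>ByteArrayOutputStream buf = new ByteArrayOutputStream();
+<br>DFSck fsck = new DFSck(conf, new PrintStream(buf, true));
+<br>ToolRunner.run(fsck, new String[] { &quot;/&quot; });
+<br>String report = buf.toString();   // parse for corrupt files instead of reading stdout
+<br>{code}</blockquote>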
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1467">HDFS-1467</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>Append pipeline never succeeds with more than one replica</b><br>
+     <blockquote>TestPipelines appears to be failing on trunk:
+<br>
+<br>Should be RBW replica after sequence of calls append()/write()/hflush() expected:&lt;RBW&gt; but was:&lt;FINALIZED&gt;
+<br>junit.framework.AssertionFailedError: Should be RBW replica after sequence of calls append()/write()/hflush() expected:&lt;RBW&gt; but was:&lt;FINALIZED&gt;
+<br>        at org.apache.hadoop.hdfs.TestPipelines.pipeline_01(TestPipelines.java:109)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1466">HDFS-1466</a>.
+     Minor bug reported by tlipcon and fixed by eli (test)<br>
+     <b>TestFcHdfsSymlink relies on /tmp/test not existing</b><br>
+     <blockquote>The test case testLinkAcrossFileSystems works with files in a directory /tmp/test. On our shared build systems this sometimes breaks because such a directory already exists but owned by some other user. The test case should use the build test dir instead.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1462">HDFS-1462</a>.
+     Major sub-task reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>Refactor edit log loading to a separate class from edit log writing</b><br>
+     <blockquote>Before the major work in HDFS-1073, I&apos;d like to do this refactor to clean up the monster FSEditLog class. We can separate all the functions that take of loading edits into an FSN from the functions that take care of writing edits, rolling, etc.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1457">HDFS-1457</a>.
+     Major improvement reported by hairong and fixed by hairong (name-node)<br>
+     <b>Limit transmission rate when transferring image between primary and secondary NNs</b><br>
+     <blockquote>If the fsimage is very big, the network saturates quickly when the SecondaryNameNode does a checkpoint, causing the JobTracker&apos;s requests to the NameNode for file data to fail during the job initialization phase. So we limit the transmission speed and compress the transmission to resolve the problem.</blockquote></li>
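+
+<blockquote>Purely illustrative: a crude per-second rate cap on a copy loop (this is not the throttler implementation that went into Hadoop):
+<br>{code}
+<br>static void copyThrottled(InputStream in, OutputStream out, long bytesPerSec)
+<br>    throws IOException, InterruptedException {
+<br>  byte[] buf = new byte[64 * 1024];
+<br>  long windowStart = System.currentTimeMillis();
+<br>  long sentThisWindow = 0;
+<br>  int n;
+<br>  while ((n = in.read(buf)) &gt; 0) {
+<br>    out.write(buf, 0, n);
+<br>    sentThisWindow += n;
+<br>    if (sentThisWindow &gt;= bytesPerSec) {        // budget for this second used up
+<br>      long elapsed = System.currentTimeMillis() - windowStart;
+<br>      if (elapsed &lt; 1000) Thread.sleep(1000 - elapsed);
+<br>      windowStart = System.currentTimeMillis();
+<br>      sentThisWindow = 0;
+<br>    }
+<br>  }
+<br>}
+<br>{code}</blockquote>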
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1456">HDFS-1456</a>.
+     Major improvement reported by jghoman and fixed by jghoman (test)<br>
+     <b>Provide builder for constructing instances of MiniDFSCluster</b><br>
+     <blockquote>Time to fix a broken window. Of the 293 occurences of &quot;new MiniDFSCluster(&quot;... most look something like:
+<br>{noformat}cluster = new MiniDFSCluster(0, config, numDatanodes, true, false, true,  null, null, null, null);{noformat}
+<br>The largest constructor takes 10 parameters, and even the overloaded constructors can be difficult to read as the arguments are mainly nulls or booleans.
+<br>
+<br>We should provide a Builder for constructing MiniDFSClusters to improve readability.</blockquote></li>
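+
+<blockquote>A sketch of the proposed builder style (method names here are assumptions about the eventual API):
+<br>{code}
+<br>MiniDFSCluster cluster = new MiniDFSCluster.Builder(config)
+<br>    .numDataNodes(3)
+<br>    .format(true)
+<br>    .build();
+<br>try {
+<br>  // run the test against cluster.getFileSystem() ...
+<br>} finally {
+<br>  cluster.shutdown();
+<br>}
+<br>{code}</blockquote>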
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1454">HDFS-1454</a>.
+     Major improvement reported by hammer and fixed by qwertymaniac (documentation, hdfs client)<br>
+     <b>Update the documentation to reflect true client caching strategy</b><br>
+     <blockquote>As noted on the mailing list (http://mail-archives.apache.org/mod_mbox/hadoop-hdfs-user/201010.mbox/%3CAANLkTi=2csK+aY05bTOuO-UZv=O4w6oX2Pq4nxGPDZBi@mail.gmail.com%3E), the &quot;Staging&quot; section of http://hadoop.apache.org/hdfs/docs/r0.21.0/hdfs_design.html#Data+Organization is out of date.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1440">HDFS-1440</a>.
+     Major bug reported by sureshms and fixed by sureshms (test)<br>
+     <b>TestComputeInvalidateWork fails intermittently</b><br>
+     <blockquote>TestComputeInvalidateWork fails intermittently. This is due to incorrect synchronization introduced due to HDFS-1093. The test uses blocks synchronized on FSNamesystem monitor, however with HDFS-1093, the FSNamesystem uses explicit read/write lock for synchronization.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1435">HDFS-1435</a>.
+     Major improvement reported by hairong and fixed by hairong (name-node)<br>
+     <b>Provide an option to store fsimage compressed</b><br>
+     <blockquote>Our HDFS has fsimage as big as 20G bytes. It consumes a lot of network bandwidth when secondary NN uploads a new fsimage to primary NN.
+<br>
+<br>If we could store fsimage compressed, the problem could be greatly alleviated.
+<br>
+<br>I plan to provide a new configuration hdfs.image.compressed with a default value of false. If it is set to true, the fsimage is stored compressed.
+<br>
+<br>The fsimage will have a new layout with a new field &quot;compressed&quot; in its header, indicating if the namespace is stored compressed or not.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1434">HDFS-1434</a>.
+     Major improvement reported by sureshms and fixed by sureshms (data-node)<br>
+     <b>Refactor Datanode#startDataNode method</b><br>
+     <blockquote>This method is very long, approximately 190 lines; it should be split into smaller methods. This also helps federation, where some of the initialization in this method will be done once per datanode and the rest once in every heartbeat thread per namenode in the DN.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1433">HDFS-1433</a>.
+     Major bug reported by sureshms and fixed by sureshms (test)<br>
+     <b>Fix test failures - TestPread and TestFileLimit</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1426">HDFS-1426</a>.
+     Major improvement reported by hairong and fixed by hairong (name-node)<br>
+     <b>Remove unused method BlockInfo#listCount</b><br>
+     <blockquote>BlockInfo#listCount is not used anywhere, so remove it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1417">HDFS-1417</a>.
+     Major improvement reported by sureshms and fixed by sureshms <br>
+     <b>Add @Override annotation to SimulatedFSDataset methods that implement FSDatasetInterface</b><br>
+     <blockquote>@Override annotations are inconsistently added to methods implementing the interface.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1409">HDFS-1409</a>.
+     Trivial bug reported by chingshen and fixed by chingshen (name-node)<br>
+     <b>The &quot;register&quot; method of the BackupNode class should be &quot;UnsupportedActionException(&quot;register&quot;)&quot;</b><br>
+     <blockquote>The register method of the BackupNode class should throw &quot;UnsupportedActionException(&quot;register&quot;)&quot; rather than  &quot;UnsupportedActionException(&quot;journal&quot;)&quot;.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1408">HDFS-1408</a>.
+     Major improvement reported by almacro and fixed by cos (test)<br>
+     <b>Herriot NN and DN clients should vend statistics</b><br>
+     <blockquote>The HDFS web user interface serves useful information through dfshealth.jsp and dfsnodelist.jsp.
+<br>The Herriot interface to the namenode and datanode (as implemented in NNClient and DNClient, respectively) would benefit from the addition of some way to channel this information. In the case of DNClient this can be an injected method that returns a DatanodeDescriptor relevant to the underlying datanode.
+<br>There seems to be no analogous NamenodeDescriptor. It may be useful to add this as a facade to a visitor that aggregates values across the filesystem datanodes.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1399">HDFS-1399</a>.
+     Major bug reported by atm and fixed by atm (security)<br>
+     <b>Distinct minicluster services (e.g. NN and JT) overwrite each other&apos;s service policies</b><br>
+     <blockquote>HDFS portion of HADOOP-6951.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1395">HDFS-1395</a>.
+     Major improvement reported by sureshms and fixed by sureshms (data-node)<br>
+     <b>Add @Override annotation to FSDataset methods that implement FSDatasetInterface</b><br>
+     <blockquote>@Override annotations are inconsistently added to methods implementing the interface.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1387">HDFS-1387</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (documentation, security)<br>
+     <b>Update HDFS permissions guide for security</b><br>
+     <blockquote>The HDFS permissions guide currently makes several statements that are no longer correct now that we provide security.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1383">HDFS-1383</a>.
+     Major improvement reported by szetszwo and fixed by szetszwo <br>
+     <b>Better error messages on hftp </b><br>
+     <blockquote>If the file is not accessible, HftpFileSystem returns only a HTTP response code.
+<br>2010-08-27 20:57:48,091 INFO org.apache.hadoop.tools.DistCp: FAIL README.txt : java.io.IOException:
+<br> Server returned HTTP response code: 400 for URL: http:/namenode:50070/data/user/tsz/README.txt?ugi=tsz,users
+<br>        at sun.net.www.protocol.http.HttpURLConnection.getInputStream(HttpURLConnection.java:1290)
+<br>        at org.apache.hadoop.hdfs.HftpFileSystem.open(HftpFileSystem.java:143)
+<br>        at org.apache.hadoop.fs.FileSystem.open(FileSystem.java:356)
+<br>        ...
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1369">HDFS-1369</a>.
+     Trivial improvement reported by eli and fixed by eli (data-node)<br>
+     <b>Invalid javadoc reference in FSDatasetMBean.java </b><br>
+     <blockquote>FSDatasetMBean.java references the non-existent class DataNodeStatisticsMBean; I believe it meant to reference DataNodeActivityMBean.
+<br>After this patch the javadoc and javadoc-dev targets run cleanly:
+<br>
+<br>     [exec] -1 overall.  
+<br>     [exec] 
+<br>     [exec]     +1 @author.  The patch does not contain any @author tags.
+<br>     [exec] 
+<br>     [exec]     -1 tests included.  The patch doesn&apos;t appear to include any new or modified tests.
+<br>     [exec]                         Please justify why no new tests are needed for this patch.
+<br>     [exec]                         Also please list what manual steps were performed to verify this patch.
+<br>     [exec] 
+<br>     [exec]     +1 javadoc.  The javadoc tool did not generate any warning messages.
+<br>     [exec] 
+<br>     [exec]     +1 javac.  The applied patch does not increase the total number of javac compiler warnings.
+<br>     [exec] 
+<br>     [exec]     +1 findbugs.  The patch does not introduce any new Findbugs warnings.
+<br>     [exec] 
+<br>     [exec]     +1 release audit.  The applied patch does not increase the total number of release audit warnings.
+<br>     [exec] 
+<br>     [exec]     +1 system tests framework.  The patch passed system tests framework compile.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1368">HDFS-1368</a>.
+     Major improvement reported by hairong and fixed by hairong (name-node)<br>
+     <b>Add a block counter to DatanodeDescriptor</b><br>
+     <blockquote>Many times, we need to count the total number of blocks in a datanode by calling DatanodeDescriptor#numBlocks(). It has to traverse the block list to get the count, which may not be trivial if there are millions of blocks. Adding a counter for each datanode does not cost much space but helps save CPU processing time.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1364">HDFS-1364</a>.
+     Major bug reported by kzhang and fixed by jnp (security)<br>
+     <b>HFTP client should support relogin from keytab</b><br>
+     <blockquote>If a user starts a long-running HFTP client using a keytab, we should do relogin automatically whenever TGT expires. Currently, HFTP client uses TGT to fetch a delegation token and cache that delegation token for HFTP operations. The delegation token is automatically renewed/refetched using TGT. However, when TGT expires, delegation token renewal/refetch will fail and no further HFTP operation is possible. This is unsatisfactory since the user has given us her keytab. We should be able to relogin from keytab and continue.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1361">HDFS-1361</a>.
+     Major bug reported by shv and fixed by shv <br>
+     <b>Add -fileStatus operation to NNThroughputBenchmark</b><br>
+     <blockquote>getFileStatus() is a frequently used operation in HDFS. It important to benchmark the name-node throughput on it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1357">HDFS-1357</a>.
+     Major bug reported by kzhang and fixed by kzhang (data-node, security)<br>
+     <b>HFTP traffic served by DataNode shouldn&apos;t use service port on NameNode </b><br>
+     <blockquote>HDFS-599 introduced a new service port on NameNode to separate system traffic (e.g., heartbeats/blockreports) from client file access requests so that they can be prioritized.  All Datanode traffic now goes to the service port. However, datanode also serves as a proxy for HFTP requests from client (served by StreamFile servlet). These HFTP traffic should continue to use the client port on NameNode. Moreover, using the service port for HFTP is incompatible with the existing way of selecting delegation tokens.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1356">HDFS-1356</a>.
+     Major improvement reported by boryas and fixed by boryas <br>
+     <b>Provide information as to whether or not security is enabled on web interface for NameNode (part of HADOOP-6822)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1355">HDFS-1355</a>.
+     Major bug reported by vicaya and fixed by vicaya (build)<br>
+     <b>ant veryclean (clean-cache) doesn&apos;t clean enough</b><br>
+     <blockquote>Looks like since HDFS-1159, ant veryclean no longer works as expected for the case when hadoop common jars are changed. The proposed patch does a more thorough cleaning of hadoop jars.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1353">HDFS-1353</a>.
+     Major improvement reported by jghoman and fixed by jghoman (name-node)<br>
+     <b>Remove most of getBlockLocation optimization</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1352">HDFS-1352</a>.
+     Major bug reported by eli and fixed by eli (build)<br>
+     <b>Fix jsvc.location</b><br>
+     <blockquote>The jsvc specified in build.xml 404s, causing the build to fail, because version 1.0.2 has been archived. Let&apos;s update the URL; it is not clear whether we want to move to 1.0.3 or keep playing the game where the build breaks with every jsvc dot release.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1349">HDFS-1349</a>.
+     Major bug reported by tomwhite and fixed by eli <br>
+     <b>Remove empty java files</b><br>
+     <blockquote>Doug identified some empty java files that should be deleted:
+<br>
+<br>src/java/org/apache/hadoop/hdfs/server/namenode/metrics/NameNodeStatisticsMBean.java
+<br>src/java/org/apache/hadoop/hdfs/server/namenode/metrics/NameNodeStatistics.java
+<br>src/java/org/apache/hadoop/hdfs/server/datanode/metrics/DataNodeStatistics.java
+<br>src/java/org/apache/hadoop/hdfs/server/datanode/metrics/DataNodeStatisticsMBean.java</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1347">HDFS-1347</a>.
+     Major bug reported by boryas and fixed by boryas (test)<br>
+     <b>TestDelegationToken uses mortbay.log for logging</b><br>
+     <blockquote>needs to be changed to commons.log</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1340">HDFS-1340</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>A null delegation token is appended to the url if security is disabled when browsing filesystem.</b><br>
+     <blockquote>  When filesystem is being browsed and if security is disabled a null delegation token is added to the url. Also if a user changes the url and adds any random string for delegation token, it is retained in the links on returned html page. If security is disabled no delegation token parameter is required on the url.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1334">HDFS-1334</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>open in HftpFileSystem does not add delegation tokens to the url.</b><br>
+     <blockquote>open method in HftpFileSystem uses ByteRangeInputStream for url connection. But it does not add the delegation tokens, even if security is enabled, to the url before passing it to the ByteRangeInputStream. Therefore request fails if security is enabled.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1330">HDFS-1330</a>.
+     Major new feature reported by hairong and fixed by johnvijoe (data-node)<br>
+     <b>Make RPCs to DataNodes timeout</b><br>
+     <blockquote>This jira aims to make client/datanode or datanode/datanode RPC to have a timeout of DataNode#socketTimeout.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1320">HDFS-1320</a>.
+     Major improvement reported by zasran and fixed by zasran <br>
+     <b>Add LOG.isDebugEnabled() guard for each LOG.debug(&quot;...&quot;)</b><br>
+     <blockquote>Each LOG.debug(&quot;...&quot;) should be executed only if LOG.isDebugEnabled() is true; in some cases it&apos;s expensive to construct the string that is being printed to the log. It&apos;s much easier to always use LOG.isDebugEnabled(), because that is simpler than reasoning in each case about whether the guard is necessary.</blockquote></li>
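+
+<p>A minimal sketch of the guard pattern, using commons-logging as the rest of Hadoop does; the class and message below are made up:</p>
+<pre>
+import org.apache.commons.logging.Log;
+import org.apache.commons.logging.LogFactory;
+
+public class DebugGuardExample {
+  private static final Log LOG = LogFactory.getLog(DebugGuardExample.class);
+
+  static void report(Object expensive) {
+    // The string concatenation runs only when debug logging is enabled.
+    if (LOG.isDebugEnabled()) {
+      LOG.debug(&quot;state=&quot; + expensive);
+    }
+  }
+}
+</pre>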
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1319">HDFS-1319</a>.
+     Major sub-task reported by jghoman and fixed by jghoman (name-node)<br>
+     <b>Fix location of re-login for secondary namenode from HDFS-999</b><br>
+     <blockquote>A bugfix to the original patch (HDFS-999) hasn&apos;t been applied to trunk yet, causing the 2nn to not be logged in at the correct time when it makes an RPC call.  This JIRA is to forward port the bugfix.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1318">HDFS-1318</a>.
+     Major new feature reported by sureshms and fixed by tanping <br>
+     <b>HDFS Namenode and Datanode WebUI information needs to be accessible programmatically for scripts</b><br>
+     <blockquote>Currently Namenode and Datanode web page needs to be scraped by scripts to get this information. Having an interface where this structured information is provided, will help building scripts around it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1317">HDFS-1317</a>.
+     Major bug reported by rohini and fixed by rohini (contrib/hdfsproxy)<br>
+     <b>HDFSProxy needs additional changes to work after changes to streamFile servlet in HDFS-1109</b><br>
+     <blockquote>Before HDFS-1109, streamFile had filename passed as a parameter in the request. With HDFS-1109, the filename is part of the request path similar to listPaths and data servlets. The AuthorizationFilter in HdfsProxy needs updating to pick up the path from the request path instead of  looking for filename parameter. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1315">HDFS-1315</a>.
+     Major improvement reported by sureshms and fixed by sureshms (name-node, tools)<br>
+     <b>Add fsck event to audit log and remove other audit log events corresponding to FSCK listStatus and open calls</b><br>
+     <blockquote>In the Yahoo production cluster audit logs, more than 50% of the entries come from FSCK. FSCK makes the same {{Namenode}} method calls as clients. Because of this, the operations are logged in the audit logs like operations invoked by a client. I want to change the namenode so that operations invoked by FSCK are not logged in the audit logs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1310">HDFS-1310</a>.
+     Major test reported by sureshms and fixed by rash37 (hdfs client)<br>
+     <b>TestFileConcurrentReader fails</b><br>
+     <blockquote>For details of test failure see http://hudson.zones.apache.org/hudson/job/Hdfs-Patch-h2.grid.sp2.yahoo.net/218/testReport/</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1308">HDFS-1308</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b> job conf key for the services name of DelegationToken for HFTP url is constructed incorrectly in HFTPFileSystem (part of MR-1718)</b><br>
+     <blockquote>change HFTP init code that checks for existing delegation tokens</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1307">HDFS-1307</a>.
+     Major improvement reported by sureshms and fixed by sureshms (name-node, tools)<br>
+     <b>Add start time, end time and total time taken for FSCK to FSCK report</b><br>
+     <blockquote>FSCK is a long running operation and makes namenode very busy when it runs. Adding information such as start time, end time and time taken helps in determining when the FSCK was run and the impact of that on Namenode.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1304">HDFS-1304</a>.
+     Major improvement reported by szetszwo and fixed by szetszwo (test)<br>
+     <b>There is no unit test for HftpFileSystem.open(..)</b><br>
+     <blockquote>HftpFileSystem.open(..) first opens a URL connection to the namenode&apos;s FileDataServlet and is then redirected to the datanode&apos;s StreamFile servlet.  Such redirection does not work in the unit test environment because the redirect URL uses the real hostname instead of localhost.
+<br>
+<br>One way to get around it is to use fault-injection in order to replace the real hostname with localhost.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1302">HDFS-1302</a>.
+     Major improvement reported by jnp and fixed by jnp <br>
+     <b>Use writeTokenStorageToStream method in Credentials to store credentials to a file.</b><br>
+     <blockquote>This jira covers hdfs changes corresponding to HADOOP-6861 and MAPREDUCE-1566.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1301">HDFS-1301</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>TestHDFSProxy need to use server side conf for ProxyUser stuff.</b><br>
+     <blockquote>Currently TestHdfsProxy sets hadoop.proxyuser.USER.groups in a local copy of the configuration,
+<br>but ProxyUsers only looks at the server-side config.
+<br>For the test we can use the static method in ProxyUsers to load the config.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1298">HDFS-1298</a>.
+     Major improvement reported by sureshms and fixed by sureshms <br>
+     <b>Add support in HDFS to update statistics that tracks number of file system operations in FileSystem</b><br>
+     <blockquote>See HADOOP-6859 for the new statistics.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1297">HDFS-1297</a>.
+     Trivial improvement reported by midojeff and fixed by midojeff (documentation)<br>
+     <b>Fix some comments</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1296">HDFS-1296</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>using delegation token over hftp for long running clients (spawn from hdfs-1007).</b><br>
+     <blockquote>this patch incorporates patches 
+<br>https://issues.apache.org/jira/secure/attachment/12446280/hdfs-1007-long-running-hftp-client.patch
+<br>and 
+<br>https://issues.apache.org/jira/secure/attachment/12446362/hdfs-1007-securityutil-fix.patch
+<br>
+<br>patches are attached.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1289">HDFS-1289</a>.
+     Major bug reported by kzhang and fixed by kzhang (data-node)<br>
+     <b>Datanode secure mode is broken</b><br>
+     <blockquote>HDFS-520 introduced a new DataNode constructor, which tries to set up an RPC connection to the NN before a Kerberos login is done. This causes datanode to fail.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1284">HDFS-1284</a>.
+     Major bug reported by shv and fixed by kzhang (test)<br>
+     <b>TestBlockToken fails</b><br>
+     <blockquote>Hudson runs fail several tests. {{TestBlockToken.testBlockTokenRpc}} is one of them.
+<br>[See here|http://hudson.zones.apache.org/hudson/job/Hdfs-Patch-h5.grid.sp2.yahoo.net/423/testReport/junit/org.apache.hadoop.hdfs.security.token.block/TestBlockToken/testBlockTokenRpc/]</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1283">HDFS-1283</a>.
+     Major bug reported by jghoman and fixed by jghoman (build)<br>
+     <b>ant eclipse-files has drifted again</b><br>
+     <blockquote>Library versions specified by ant eclipse-files have drifted from those used by ivy again.  Until HDFS-1035 meanders into the code, we need to make sure we keep these updated, otherwise bedlam breaks loose for Eclipse developers.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1272">HDFS-1272</a>.
+     Major improvement reported by jnp and fixed by jnp <br>
+     <b>HDFS changes corresponding to rename of TokenStorage to Credentials</b><br>
+     <blockquote>TokenStorage is renamed to Credentials as part of MAPREDUCE-1528 and HADOOP-6845. This jira tracks hdfs changes corresponding to that.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1250">HDFS-1250</a>.
+     Major bug reported by sureshms and fixed by sureshms (name-node)<br>
+     <b>Namenode accepts block report from dead datanodes</b><br>
+     <blockquote>When a datanode heartbeat times out namenode marks it dead. The subsequent heartbeat from the datanode is rejected with a command to datanode to re-register. However namenode accepts block report from the datanode although it is marked dead.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1205">HDFS-1205</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>FSDatasetAsyncDiskService should name its threads</b><br>
+     <blockquote>FSDatasetAsyncService creates threads but doesn&apos;t name them. The ThreadFactory should name them with the volume they work on as well as a thread index.</blockquote></li>
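+
+<p>A small, hypothetical sketch of a ThreadFactory that names its threads with a volume label and an index, as the entry above suggests; the names and fields are illustrative, not the FSDatasetAsyncDiskService code:</p>
+<pre>
+import java.util.concurrent.ThreadFactory;
+import java.util.concurrent.atomic.AtomicInteger;
+
+public class NamedThreadFactory implements ThreadFactory {
+  private final String volume;
+  private final AtomicInteger index = new AtomicInteger(0);
+
+  public NamedThreadFactory(String volume) {
+    this.volume = volume;
+  }
+
+  @Override
+  public Thread newThread(Runnable r) {
+    // Produces names like &quot;Async disk worker #3 for volume /data/1&quot;.
+    return new Thread(r, &quot;Async disk worker #&quot; + index.incrementAndGet()
+        + &quot; for volume &quot; + volume);
+  }
+}
+</pre>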
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1203">HDFS-1203</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>DataNode should sleep before reentering service loop after an exception</b><br>
+     <blockquote>When the DN gets an exception in response to a heartbeat, it logs it and continues, but there is no sleep. I&apos;ve occasionally seen bugs produce a case where heartbeats continuously produce exceptions, and thus the DN floods the NN with bad heartbeats. Adding a 1 second sleep at least throttles the error messages for easier debugging and error isolation.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1202">HDFS-1202</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>DataBlockScanner throws NPE when updated before initialized</b><br>
+     <blockquote>Missing an isInitialized() check in updateScanStatusInternal</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1201">HDFS-1201</a>.
+     Major improvement reported by jnp and fixed by kzhang <br>
+     <b> Support for using different Kerberos keys for Namenode and datanode.</b><br>
+     <blockquote>This jira covers the hdfs changes to support different Kerberos keys for Namenode and datanode. This corresponds to changes in HADOOP-6632</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1198">HDFS-1198</a>.
+     Major bug reported by jnp and fixed by jnp (name-node)<br>
+     <b>Resolving cross-realm principals</b><br>
+     <blockquote>This jira covers hdfs changes corresponding to HADOOP-6603. Kerberos has a bug in resolving cross-realm principals. This jira provides a work-around for that.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1192">HDFS-1192</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>refreshSuperUserGroupsConfiguration should use server side configuration for the refresh (for HADOOP-6815)</b><br>
+     <blockquote>Currently refreshSuperUserGroupsConfiguration is using the client-side Configuration.
+<br>One of the issues with this is that if the cluster is restarted it will lose the &quot;refreshed&quot; values (unless they are copied to the NameNode/JobTracker machine).
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1190">HDFS-1190</a>.
+     Minor improvement reported by midojeff and fixed by midojeff (data-node)<br>
+     <b>Remove unused getNamenode() method from DataNode.</b><br>
+     <blockquote>This patch removes the getNamenode() method from DataNode, which appears to be unused.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1187">HDFS-1187</a>.
+     Major improvement reported by owen.omalley and fixed by owen.omalley (security)<br>
+     <b>Modify fetchdt to allow renewing and canceling token</b><br>
+     <blockquote>I would like to extend fetchdt to allow renewing and canceling tokens.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1185">HDFS-1185</a>.
+     Minor improvement reported by midojeff and fixed by midojeff (data-node, name-node)<br>
+     <b>Remove duplicate now() functions in DataNode, FSNamesystem</b><br>
+     <blockquote>An identical now() function is defined in Util, DataNode, and FSNamesystem.  This patch removes the latter two and converts all calls to use the Util.now function.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1184">HDFS-1184</a>.
+     Minor improvement reported by midojeff and fixed by midojeff <br>
+     <b>Replace tabs in code with spaces</b><br>
+     <blockquote>Replace some code indentation that uses tabs with spaces, to match the coding convention</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1183">HDFS-1183</a>.
+     Minor improvement reported by midojeff and fixed by midojeff (name-node)<br>
+     <b>Remove some duplicate code in NamenodeJspHelper.java</b><br>
+     <blockquote>This patch refactors out some duplicate code in generateNodeData and generateDecommissioningNodeData in NamenodeJspHelper.java.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1178">HDFS-1178</a>.
+     Major improvement reported by owen.omalley and fixed by owen.omalley (name-node)<br>
+     <b>The NameNode servlets should not use RPC to connect to the NameNode</b><br>
+     <blockquote>Currently some of the NameNode servlets use RPC to connect from the NameNode to itself. They should do it more directly with the NameNode object.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1167">HDFS-1167</a>.
+     Major task reported by vinaythota and fixed by vinaythota (test)<br>
+     <b>New property for local conf directory in system-test-hdfs.xml file.</b><br>
+     <blockquote>Adding new property in system-test.xml file for local configuration directory.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1164">HDFS-1164</a>.
+     Major bug reported by eli and fixed by tlipcon (contrib/hdfsproxy)<br>
+     <b>TestHdfsProxy is failing</b><br>
+     <blockquote>TestHdfsProxy is failing on trunk, seen in HDFS-1132 and HDFS-1143. It doesn&apos;t look like hudson posts test results for contrib and it&apos;s hard to see what&apos;s going on from the raw console output. Can someone with access to hudson upload the individual test output for TestHdfsProxy so we can see what the issue is?</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1163">HDFS-1163</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>normalize property names for JT/NN kerberos principal names in configuration (from HADOOP 6633)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1160">HDFS-1160</a>.
+     Major improvement reported by eli and fixed by eli (data-node)<br>
+     <b>Improve some FSDataset warnings and comments</b><br>
+     <blockquote>The warning in FSDataset that prints &quot;removing block&quot; is clearer as &quot;Removing replica info for block&quot;, since the DN is not actually removing the block. The attached patch also cleans up and fixes typos in some related comments and code. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1157">HDFS-1157</a>.
+     Major bug reported by cos and fixed by cos (test)<br>
+     <b>Modifications introduced by HDFS-1150 are breaking aspect&apos;s bindings</b><br>
+     <blockquote>Modifications introduced by HDFS-1150 to the DataNode class break some of the Herriot (test framework) aspect bindings. This JIRA is to track the fix.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1150">HDFS-1150</a>.
+     Major new feature reported by jghoman and fixed by jghoman (data-node)<br>
+     <b>Verify datanodes&apos; identities to clients in secure clusters</b><br>
+     <blockquote>Currently we use block access tokens to allow datanodes to verify clients&apos; identities, however we don&apos;t have a way for clients to verify the authenticity of the datanodes themselves.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1146">HDFS-1146</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>Javadoc for getDelegationTokenSecretManager in FSNamesystem</b><br>
+     <blockquote>Javadoc is missing for public method getDelegationTokenSecretManager in FSNamesystem.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1145">HDFS-1145</a>.
+     Major bug reported by dhruba and fixed by dhruba (name-node)<br>
+     <b>When NameNode is shutdown it tries to exit safemode</b><br>
+     <blockquote>Suppose the NameNode is in safemode and we try to shut it down by invoking NameNode.stop(). The stop() method interrupts all waiting threads, which in turn causes the SafeMode monitor to exit, thus triggering replication/deletion of blocks.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1141">HDFS-1141</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>completeFile does not check lease ownership</b><br>
+     <blockquote>completeFile should check that the caller still owns the lease of the file that it&apos;s completing. This is for the &apos;testCompleteOtherLeaseHoldersFile&apos; case in HDFS-1139.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1140">HDFS-1140</a>.
+     Minor improvement reported by dms and fixed by dms (name-node)<br>
+     <b>Speedup INode.getPathComponents</b><br>
+     <blockquote>When the namenode is loading the image, a significant amount of time is spent in DFSUtil.string2Bytes. We have a very specific workload here: the path that the namenode calls getPathComponents for shares N - 1 components with the previous path this method was called for (assuming the current path has N components).
+<br>Hence we can improve the image load time by caching the result of the previous conversion.
+<br>We thought of using a simple LRU cache for components, but in practice String.getBytes gets optimized at runtime and an LRU cache doesn&apos;t perform as well; however, keeping just the latest path components and their translation to bytes in two arrays gives quite a performance boost.
+<br>I could get another 20% off the time to load the image on our cluster (30 seconds vs 24), and I wrote a simple benchmark that tests performance with and without caching.</blockquote></li>
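+
+<p>An illustrative sketch, not the actual DFSUtil code, of the caching idea: keep the previous path components and their byte[] conversions and reuse any matching prefix:</p>
+<pre>
+import java.nio.charset.StandardCharsets;
+
+public class PathComponentCache {
+  private String[] lastComponents = new String[0];
+  private byte[][] lastBytes = new byte[0][];
+
+  public byte[][] toBytes(String[] components) {
+    byte[][] result = new byte[components.length][];
+    for (int i = 0; i < components.length; i++) {
+      byte[] cached = null;
+      if (i < lastComponents.length) {
+        if (lastComponents[i].equals(components[i])) {
+          cached = lastBytes[i];   // reuse the previous conversion for the shared prefix
+        }
+      }
+      // Convert only the components that differ from the previous path.
+      result[i] = (cached != null) ? cached : components[i].getBytes(StandardCharsets.UTF_8);
+    }
+    lastComponents = components;
+    lastBytes = result;
+    return result;
+  }
+}
+</pre>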
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1138">HDFS-1138</a>.
+     Major bug reported by dms and fixed by dms <br>
+     <b>Modification times are being overwritten when FSImage loads</b><br>
+     <blockquote>A very easy way to spot the bug is to do a second restart in TestRestartDFS and check that the modification time on root is the same as it was before the second restart.
+<br>
+<br>The problem is that addToParent modifies the parent&apos;s modification time if the modification time of the child is greater than the parent&apos;s.
+<br>
+<br>So if you have /DIR/File, then on creation of the file the modification time of DIR is set; but on cluster restart, or when the secondary is checkpointing and reading the image, it adds DIR to &quot;/&quot; and writes a new modification time for &quot;/&quot;, namely the modification time of DIR.
+<br>
+<br>This is clearly a bug. I will attach a patch with one more parameter passed from loadFSImage that says not to propagate the time.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1132">HDFS-1132</a>.
+     Minor test reported by eli and fixed by eli (test)<br>
+     <b>Refactor TestFileStatus</b><br>
+     <blockquote>When writing HADOOP-6585 I noticed TestFileStatus is an old test with just one monolithic test function. We should rewrite it as a junit4-style test and break up the functions into setup, teardown, and five individual test cases. The same tests are run, but they are easier to follow and modify, and new tests are easier to add. Patch coming.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1130">HDFS-1130</a>.
+     Major bug reported by amareshwari and fixed by devaraj (security)<br>
+     <b>Pass Administrator acl to HTTPServer for common servlet access.</b><br>
+     <blockquote>Once HADOOP-6748 is done, HDFS should pass administrator acl when HTTPServer is constructed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1119">HDFS-1119</a>.
+     Major sub-task reported by szetszwo and fixed by szetszwo (name-node)<br>
+     <b>Refactor BlocksMap with GettableSet</b><br>
+     <blockquote>The data structure required in BlocksMap is a GettableSet.  See also [this comment|https://issues.apache.org/jira/browse/HDFS-1114?focusedCommentId=12862118&amp;page=com.atlassian.jira.plugin.system.issuetabpanels%3Acomment-tabpanel#action_12862118].</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1118">HDFS-1118</a>.
+     Major bug reported by zshao and fixed by zshao <br>
+     <b>DFSOutputStream socket leak when cannot connect to DataNode</b><br>
+     <blockquote>The offending code is in {{DFSOutputStream.nextBlockOutputStream}}
+<br>
+<br>This function retries several times to call {{createBlockOutputStream}}. Each time when it fails, it leaves a {{Socket}} object in {{DFSOutputStream.s}}.
+<br>That object is never closed, but overwritten the next time {{createBlockOutputStream}} is called.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1114">HDFS-1114</a>.
+     Major improvement reported by szetszwo and fixed by szetszwo (name-node)<br>
+     <b>Reducing NameNode memory usage by an alternate hash table</b><br>
+     <blockquote>NameNode uses a java.util.HashMap to store BlockInfo objects.  When there are many blocks in HDFS, this map uses a lot of memory in the NameNode.  We may optimize the memory usage with a lightweight hash table implementation.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1112">HDFS-1112</a>.
+     Major bug reported by hairong and fixed by hairong (name-node)<br>
+     <b>Edit log buffer should not grow unboundedly</b><br>
+     <blockquote>Currently HDFS does not impose an upper limit on the edit log buffer. If a large number of open operations come in with access-time updates enabled, then, since open does not call sync automatically, the buffer may grow to a large size, causing a memory leak and full GC in extreme cases, as described in HDFS-1104. 
+<br>
+<br>The edit log buffer should be automatically flushed when the buffer becomes full.</blockquote></li>
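+
+<p>A minimal sketch of the flush-when-full idea under simplified assumptions (a plain in-memory buffer and an arbitrary output stream), not the FSEditLog implementation:</p>
+<pre>
+import java.io.ByteArrayOutputStream;
+import java.io.IOException;
+import java.io.OutputStream;
+
+public class BoundedEditBuffer {
+  private final ByteArrayOutputStream buffer = new ByteArrayOutputStream();
+  private final OutputStream journal;   // wherever flushed edits go
+  private final int maxBufferedBytes;   // upper bound before a forced flush
+
+  public BoundedEditBuffer(OutputStream journal, int maxBufferedBytes) {
+    this.journal = journal;
+    this.maxBufferedBytes = maxBufferedBytes;
+  }
+
+  public synchronized void logEdit(byte[] record) throws IOException {
+    buffer.write(record);
+    if (buffer.size() >= maxBufferedBytes) {
+      flush();                           // do not let the buffer grow unboundedly
+    }
+  }
+
+  public synchronized void flush() throws IOException {
+    buffer.writeTo(journal);
+    journal.flush();
+    buffer.reset();
+  }
+}
+</pre>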
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1111">HDFS-1111</a>.
+     Major new feature reported by rschmidt and fixed by sriramsrao <br>
+     <b>getCorruptFiles() should give some hint that the list is not complete</b><br>
+     <blockquote>The list of corrupt files returned by the namenode doesn&apos;t indicate anything when the number of corrupted files is larger than the call output limit (which means the list is not complete). There should be a way to hint incompleteness to clients.
+<br>
+<br>A simple hack would be to add an extra entry with the value null to the returned array. Clients could interpret this as a sign that there are other corrupt files in the system.
+<br>
+<br>We should also rephrase the fsck output to make it more confident when the list is complete and less confident when the list is known to be incomplete.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1110">HDFS-1110</a>.
+     Major improvement reported by sureshms and fixed by sureshms <br>
+     <b>Namenode heap optimization - reuse objects for commonly used file names</b><br>
+     <blockquote>There are a lot of common file names used in HDFS, mainly created by mapreduce, such as file names starting with &quot;part&quot;. Reusing byte[] corresponding to these recurring file names will save significant heap space used for storing the file names in millions of INodeFile objects.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1109">HDFS-1109</a>.
+     Major bug reported by dms and fixed by dms (contrib/hdfsproxy, data-node)<br>
+     <b>HFTP and URL Encoding</b><br>
+     <blockquote>We just saw this error happen in our cluster. If there is a file that has a &quot;+&quot; sign in the name, it is not readable through the HFTP protocol.
+<br>The problem is that when we are reading a file with HFTP we pass the name of the file as a parameter in the request, and the &quot;+&quot; gets decoded into a space on the server side. So the datanode receiving the streamFile request tries to access a file with a space instead of a &quot;+&quot; in the name and doesn&apos;t find that file.
+<br>
+<br>The proposed solution is to pass the filename as a part of URL as with all the other HFTP commands, since this is the only place where it is not being treated this way. Are there any objections to this?</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1096">HDFS-1096</a>.
+     Major new feature reported by boryas and fixed by boryas (security)<br>
+     <b>allow dfsadmin/mradmin refresh of superuser proxy group mappings</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1093">HDFS-1093</a>.
+     Major improvement reported by dhruba and fixed by dhruba (name-node)<br>
+     <b>Improve namenode scalability by splitting the FSNamesystem synchronized section in a read/write lock</b><br>
+     <blockquote>Most critical data structures in the NameNode (NN) are protected by synchronized methods in the FSNamesystem class. This essentially makes critical code paths in the NN single-threaded. However, a large percentage of the NN calls are listStatus, getBlockLocations, etc., which do not change internal data structures at all; these are read-only calls. If we change the FSNamesystem lock to a read/write lock, many of the above operations can occur in parallel, thus improving the scalability of the NN.</blockquote></li>
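+
+<p>A minimal sketch of the read/write-lock pattern using java.util.concurrent; the class and fields are stand-ins, not the FSNamesystem code:</p>
+<pre>
+import java.util.concurrent.locks.ReentrantReadWriteLock;
+
+public class ReadWriteLockedNamesystem {
+  private final ReentrantReadWriteLock lock = new ReentrantReadWriteLock();
+  private long fileCount;   // stands in for the real namespace state
+
+  // Read-only calls (e.g. listStatus, getBlockLocations) can run concurrently.
+  public long getFileCount() {
+    lock.readLock().lock();
+    try {
+      return fileCount;
+    } finally {
+      lock.readLock().unlock();
+    }
+  }
+
+  // Mutating calls still take the exclusive write lock.
+  public void addFile() {
+    lock.writeLock().lock();
+    try {
+      fileCount++;
+    } finally {
+      lock.writeLock().unlock();
+    }
+  }
+}
+</pre>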
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1085">HDFS-1085</a>.
+     Major bug reported by knoguchi and fixed by szetszwo (data-node)<br>
+     <b>hftp read  failing silently</b><br>
+     <blockquote>When performing a massive distcp through hftp, we saw many tasks fail with 
+<br>
+<br>2010-04-06 17:56:43,005 INFO org.apache.hadoop.tools.DistCp: FAIL 2010/0/part-00032 : java.io.IOException: File size not matched: copied 193855488 bytes (184.9m) to tmpfile (=hdfs://omehost.com:8020/somepath/part-00032)
+<br>but expected 1710327403 bytes (1.6g) from hftp://someotherhost/somepath/part-00032
+<br>        at org.apache.hadoop.tools.DistCp$CopyFilesMapper.copy(DistCp.java:435)
+<br>        at org.apache.hadoop.tools.DistCp$CopyFilesMapper.map(DistCp.java:543)
+<br>        at org.apache.hadoop.tools.DistCp$CopyFilesMapper.map(DistCp.java:310)
+<br>        at org.apache.hadoop.mapred.MapRunner.run(MapRunner.java:50)
+<br>        at org.apache.hadoop.mapred.MapTask.runOldMapper(MapTask.java:358)
+<br>        at org.apache.hadoop.mapred.MapTask.run(MapTask.java:307)
+<br>        at org.apache.hadoop.mapred.Child.main(Child.java:159)
+<br>
+<br>This means that the read itself didn&apos;t fail, but the resulting file was somehow smaller.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1081">HDFS-1081</a>.
+     Major improvement reported by jghoman and fixed by jghoman (security)<br>
+     <b>Performance regression in DistributedFileSystem::getFileBlockLocations in secure systems</b><br>
+     <blockquote>We&apos;ve seen a significant decrease in the performance of DistributedFileSystem::getFileBlockLocations() with security turned on Y20. This JIRA is for correcting and tracking it both on Y20 and trunk.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1080">HDFS-1080</a>.
+     Major bug reported by jghoman and fixed by jghoman (name-node)<br>
+     <b>SecondaryNameNode image transfer should use the defined http address rather than local ip address</b><br>
+     <blockquote>Currently when telling the NN where to get the merged image, SNN uses getLocalHost.getAddr(), which may not return the correct ip addr.  </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1079">HDFS-1079</a>.
+     Major new feature reported by sureshms and fixed by sureshms (name-node)<br>
+     <b>HDFS implementation should throw exceptions defined in AbstractFileSystem</b><br>
+     <blockquote>HDFS implementation Hdfs.java should throw exceptions as defined in AbstractFileSystem. To facilitate this, ClientProtocol should be changed to throw specific exceptions, as defined in AbstractFileSystem.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1071">HDFS-1071</a>.
+     Major sub-task reported by dhruba and fixed by dms (name-node)<br>
+     <b>savenamespace should write the fsimage to all configured fs.name.dir in parallel</b><br>
+     <blockquote>If you have a large number of files in HDFS, the fsimage file is very big. When the namenode restarts, it writes a copy of the fsimage to all directories configured in fs.name.dir. This takes a long time, especially if there are many directories in fs.name.dir. Make the NN write the fsimage to all these directories in parallel.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1061">HDFS-1061</a>.
+     Minor improvement reported by bharathm and fixed by bharathm (name-node)<br>
+     <b>Memory footprint optimization for INodeFile object. </b><br>
+     <blockquote>I am proposing a footprint optimization to merge the blockReplication and preferredBlockSize fields into one &apos;long header&apos; field in the INodeFile class. This saves 8 bytes per INodeFile object on a 64-bit JVM. This memory optimization is transparent and the changes are very minimal.
+<br></blockquote></li>
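+
+<p>An illustrative sketch of packing two fields into one long; the field widths chosen here are assumptions, not the actual INodeFile layout, and it assumes a non-negative replication factor and a block size that fits in 48 bits:</p>
+<pre>
+public class PackedHeader {
+  // Upper 16 bits: replication factor; lower 48 bits: preferred block size.
+  private long header;
+
+  public void set(short replication, long preferredBlockSize) {
+    header = ((long) replication << 48) | preferredBlockSize;
+  }
+
+  public short getReplication() {
+    return (short) (header >>> 48);
+  }
+
+  public long getPreferredBlockSize() {
+    return (header << 16) >>> 16;   // clear the replication bits
+  }
+}
+</pre>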
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1055">HDFS-1055</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (data-node)<br>
+     <b>Improve thread naming for DataXceivers</b><br>
+     <blockquote>The DataXceiver threads are named using the default Daemon naming, which is Runnable.toString(). Currently this isn&apos;t implemented, so threads have names like org.apache.hadoop.hdfs.server.datanode.DataXceiver@579c9a6b. It would be very handy for debugging (and even ops maybe) to have a better name like &quot;DataXceiver for client 1.2.3.4 [reading block_234254242]&quot;</blockquote></li>
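+
+<p>A small sketch of renaming the current thread while an operation is in flight; the name format is taken from the entry above and the helper method itself is hypothetical:</p>
+<pre>
+public class ThreadNamingExample {
+  static void serve(String clientAddress, String blockId, Runnable work) {
+    String oldName = Thread.currentThread().getName();
+    Thread.currentThread().setName(&quot;DataXceiver for client &quot; + clientAddress
+        + &quot; [reading &quot; + blockId + &quot;]&quot;);
+    try {
+      work.run();                                 // handle the request under the descriptive name
+    } finally {
+      Thread.currentThread().setName(oldName);    // restore the original name afterwards
+    }
+  }
+}
+</pre>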
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1045">HDFS-1045</a>.
+     Major bug reported by jghoman and fixed by jghoman (security)<br>
+     <b>In secure clusters, re-login is necessary for https clients before opening connections</b><br>
+     <blockquote>Ticket credentials expire and therefore clients opening https connections (only the NN and SNN doing image/edits exchange) should re-login before opening those connections.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1044">HDFS-1044</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>Cannot submit mapreduce job from secure client to unsecure server</b><br>
+     <blockquote>Looks like it tries to get a DelegationToken and fails because the secret manager on the server doesn&apos;t start in a non-secure environment.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1039">HDFS-1039</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>Service should be set in the token in JspHelper.getUGI</b><br>
+     <blockquote> The delegation token added to the UGI in getUGI method in the JspHelper does not have service set. Therefore, this token cannot be used to connect to the namenode.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1038">HDFS-1038</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>In nn_browsedfscontent.jsp fetch delegation token only if security is enabled.</b><br>
+     <blockquote>nn_browsedfscontent.jsp  calls getDelegationToken even if security is disabled, which causes NPE. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1036">HDFS-1036</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>in DelegationTokenFetch dfs.getURI returns no port</b><br>
+     <blockquote>dfs.getUri().getPort() returns -1.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1035">HDFS-1035</a>.
+     Major improvement reported by tomwhite and fixed by nidaley (build)<br>
+     <b>Generate Eclipse&apos;s .classpath file from Ivy config</b><br>
+     <blockquote>HDFS companion issue for HADOOP-6407.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1033">HDFS-1033</a>.
+     Major improvement reported by jghoman and fixed by jghoman (name-node, security)<br>
+     <b>In secure clusters, NN and SNN should verify the remote principal during image and edits transfer</b><br>
+     <blockquote>Currently anyone can connect and download image/edits from Namenode.  In a secure cluster we can verify the identity of the principal making the request; we should disallow requests from anyone except the NN and SNN principals (and their hosts due to the lousy KerbSSL limitation).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1028">HDFS-1028</a>.
+     Minor improvement reported by tlipcon and fixed by dms (name-node)<br>
+     <b>INode.getPathNames could split more efficiently</b><br>
+     <blockquote>INode.getPathnames uses String.split(String) which actually uses the full Java regex implementation. Since we&apos;re always splitting on a single char, we could implement a faster one like StringUtils.split() (except without the escape character). This takes a significant amount of CPU during FSImage loading so should be a worthwhile speedup.</blockquote></li>
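+
+<p>A sketch of splitting on a single character without the regex machinery, illustrating the idea; this is not the actual INode or StringUtils code:</p>
+<pre>
+public class FastSplit {
+  public static String[] split(String s, char sep) {
+    // First pass: count separators to size the result array.
+    int count = 1;
+    for (int i = 0; i < s.length(); i++) {
+      if (s.charAt(i) == sep) count++;
+    }
+    String[] parts = new String[count];
+    // Second pass: copy each component.
+    int start = 0;
+    int idx = 0;
+    for (int i = 0; i < s.length(); i++) {
+      if (s.charAt(i) == sep) {
+        parts[idx++] = s.substring(start, i);
+        start = i + 1;
+      }
+    }
+    parts[idx] = s.substring(start);
+    return parts;
+  }
+}
+// e.g. splitting /user/hadoop/file on the / separator yields an empty first component,
+// then user, hadoop, file.
+</pre>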
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1027">HDFS-1027</a>.
+     Trivial bug reported by raviphulari and fixed by raviphulari <br>
+     <b>Update  year to 2010.</b><br>
+     <blockquote>Copyright year needs to be updated from 2009 to 2010.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1023">HDFS-1023</a>.
+     Major improvement reported by jghoman and fixed by jghoman (name-node)<br>
+     <b>Allow http server to start as regular principal if https principal not defined.</b><br>
+     <blockquote>Currently limitations in Sun&apos;s KerbSSL implementation require the https server to be run as &quot;host/[machine]@realm.&quot; and another Sun KerbSSL limitation appears to require you to store all principals in the same keytab, meaning fully functional, secured Namenodes require combined keytabs.  However, it may be that one wishes to run a namenode without a secondary namenode or other utilities that require https.  In this case, we should allow the http server to start and log a warning that it will not be able to accept https connections.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1021">HDFS-1021</a>.
+     Major bug reported by boryas and fixed by boryas (security)<br>
+     <b>specify correct server principal for RefreshAuthorizationPolicyProtocol and RefreshUserToGroupMappingsProtocol protocols in DFSAdmin (for HADOOP-6612)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1019">HDFS-1019</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>Incorrect default values for delegation tokens in hdfs-default.xml</b><br>
+     <blockquote> The default values for delegation token parameters in hdfs-default.xml are incorrect.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1017">HDFS-1017</a>.
+     Major bug reported by jghoman and fixed by jghoman (security)<br>
+     <b>browsedfs jsp should call JspHelper.getUGI rather than using createRemoteUser()</b><br>
+     <blockquote>Currently the JSP for browsing the file system calls getRemoteUser(), which doesn&apos;t correctly authenticate the user on the web, causing failures when trying to browse the filesystem through the web UI.  It should call the utility method JspHelper.getUGI instead.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1007">HDFS-1007</a>.
+     Major bug reported by devaraj and fixed by devaraj (security)<br>
+     <b>HFTP needs to be updated to use delegation tokens</b><br>
+     <blockquote>HFTPFileSystem should be updated to use the delegation tokens so that it can talk to the secure namenodes.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1006">HDFS-1006</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>getImage/putImage http requests should be https for the case of security enabled.</b><br>
+     <blockquote>should use https:// and port 50475</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1005">HDFS-1005</a>.
+     Major new feature reported by jnp and fixed by boryas <br>
+     <b>Fsck security</b><br>
+     <blockquote>This jira tracks implementation of security for Fsck. Fsck should make an authenticated connection to the namenode.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1004">HDFS-1004</a>.
+     Major new feature reported by jghoman and fixed by jghoman (name-node)<br>
+     <b>Update NN to support Kerberized SSL from HADOOP-6584</b><br>
+     <blockquote>Namenode needs to be tweaked to use the new kerberized-back ssl connector.  </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1003">HDFS-1003</a>.
+     Major new feature reported by boryas and fixed by boryas <br>
+     <b>authorization checks for inter-server protocol (based on HADOOP-6600)</b><br>
+     <blockquote>authorization checks for inter-server protocol (based on HADOOP-6600)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1001">HDFS-1001</a>.
+     Minor bug reported by bcwalrus and fixed by bcwalrus (data-node)<br>
+     <b>DataXceiver and BlockReader disagree on when to send/recv CHECKSUM_OK</b><br>
+     <blockquote>Running the TestPread with additional debug statements reveals that the BlockReader sends CHECKSUM_OK when the DataXceiver doesn&apos;t expect it. Currently it doesn&apos;t matter since DataXceiver closes the connection after each op, and CHECKSUM_OK is the last thing on the wire. But if we want to cache connections, they need to agree on the exchange of CHECKSUM_OK.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-992">HDFS-992</a>.
+     Major new feature reported by kzhang and fixed by kzhang (security)<br>
+     <b>Re-factor block access token implementation to conform to the generic Token interface in Common</b><br>
+     <blockquote>This makes it possible to use block access token as shared key for client-to-datanode authentication over RPC. However, access authorization is still based on block access token semantics.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-988">HDFS-988</a>.
+     Blocker bug reported by dhruba and fixed by eli (name-node)<br>
+     <b>saveNamespace race can corrupt the edits log</b><br>
+     <blockquote>The administrator puts the namenode in safemode and then issues the savenamespace command. This can corrupt the edits log. The problem is that when the NN enters safemode, there could still be pending logSyncs occurring from other threads. Now, the saveNamespace command, when executed, would save an edits log with partial writes. I have seen this happen on 0.20.
+<br>
+<br>https://issues.apache.org/jira/browse/HDFS-909?focusedCommentId=12828853&amp;page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel#action_12828853</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-982">HDFS-982</a>.
+     Blocker test reported by eli and fixed by pocheung (contrib/hdfsproxy, security)<br>
+     <b>TestDelegationToken#testDelegationTokenWithRealUser is failing</b><br>
+     <blockquote>Hudson is reporting that TestDelegationToken#testDelegationTokenWithRealUser is failing on trunk.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-981">HDFS-981</a>.
+     Blocker test reported by eli and fixed by cos (contrib/hdfsproxy)<br>
+     <b>test-contrib fails due to test-cactus failure</b><br>
+     <blockquote>Relevant output from a recent run http://hudson.zones.apache.org/hudson/job/Hdfs-Patch-h5.grid.sp2.yahoo.net/232/console
+<br>
+<br>     [exec] BUILD FAILED
+<br>     [exec] /grid/0/hudson/hudson-slave/workspace/Hdfs-Patch-h5.grid.sp2.yahoo.net/trunk/build.xml:568: The following error occurred while executing this line:
+<br>     [exec] /grid/0/hudson/hudson-slave/workspace/Hdfs-Patch-h5.grid.sp2.yahoo.net/trunk/src/contrib/build.xml:48: The following error occurred while executing this line:
+<br>     [exec] /grid/0/hudson/hudson-slave/workspace/Hdfs-Patch-h5.grid.sp2.yahoo.net/trunk/src/contrib/hdfsproxy/build.xml:292: org.codehaus.cargo.container.ContainerException: Failed to download [http://apache.osuosl.org/tomcat/tomcat-6/v6.0.18/bin/apache-tomcat-6.0.18.zip]</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-977">HDFS-977</a>.
+     Trivial bug reported by stevel@apache.org and fixed by qwertymaniac (data-node)<br>
+     <b>DataNode.createInterDataNodeProtocolProxy() guards a log at the wrong level</b><br>
+     <blockquote>My IDE tells me that this code snippet in {{DataNode.createInterDataNodeProtocolProxy()}} is guarding the info log entry at debug level, and it should be reviewed
+<br>    if (InterDatanodeProtocol.LOG.isDebugEnabled()) {
+<br>      InterDatanodeProtocol.LOG.info(&quot;InterDatanodeProtocol addr=&quot; + addr);
+<br>    }
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-970">HDFS-970</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (name-node)<br>
+     <b>FSImage writing should always fsync before close</b><br>
+     <blockquote>Without an fsync, it&apos;s common that filesystems will delay the writing of metadata to the journal until all of the data blocks have been flushed. If the system crashes while the dirty pages haven&apos;t been flushed, the file is left in an indeterminate state. In some FSs (eg ext4) this will result in a 0-length file. In others (eg XFS) it will result in the correct length but any number of data blocks getting zeroed. Calling FileChannel.force before closing the FSImage prevents this issue.</blockquote></li>
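+
+<p>A minimal sketch of forcing file contents to disk before close via FileChannel.force; the helper below is hypothetical, not the FSImage code:</p>
+<pre>
+import java.io.FileOutputStream;
+import java.io.IOException;
+
+public class FsyncBeforeClose {
+  public static void writeDurably(String path, byte[] data) throws IOException {
+    FileOutputStream out = new FileOutputStream(path);
+    try {
+      out.write(data);
+      out.flush();
+      out.getChannel().force(true);   // fsync: flush data and metadata to the device before closing
+    } finally {
+      out.close();
+    }
+  }
+}
+</pre>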
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-947">HDFS-947</a>.
+     Major improvement reported by dhruba and fixed by dms <br>
+     <b>The namenode should redirect a hftp request to read a file to the datanode that has the maximum number of local replicas</b><br>
+     <blockquote>A client that uses the Hftp protocol to read a file is redirected by the namenode to a random datanode. It would be nice if the client gets redirected to a datanode that has the maximum number of local replicas of the blocks of the file.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-941">HDFS-941</a>.
+     Major improvement reported by tlipcon and fixed by bcwalrus (data-node, hdfs client, performance)<br>
+     <b>Datanode xceiver protocol should allow reuse of a connection</b><br>
+     <blockquote>Right now each connection into the datanode xceiver only processes one operation.
+<br>
+<br>In the case that an operation leaves the stream in a well-defined state (eg a client reads to the end of a block successfully) the same connection could be reused for a second operation. This should improve random read performance significantly.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-912">HDFS-912</a>.
+     Minor bug reported by aw and fixed by aw <br>
+     <b> sed in build.xml fails</b><br>
+     <blockquote>This is the HDFS version of HADOOP-6505.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-903">HDFS-903</a>.
+     Critical bug reported by eli and fixed by hairong (name-node)<br>
+     <b>NN should verify images and edit logs on startup</b><br>
+     <blockquote>I was playing around with corrupting fsimage and edits logs when there are multiple dfs.name.dirs specified. I noticed that:
+<br> * As long as the corruption does not make the image unparseable (e.g. does not change an opcode into an invalid one), HDFS doesn&apos;t notice and happily uses a corrupt image or applies the corrupt edit.
+<br>* If the first image in dfs.name.dir is &quot;valid&quot;, it replaces the other copies in the other name.dirs, even if they are different, with this first image, i.e. if the first image actually contains invalid/old/corrupt metadata then you&apos;ve lost your valid metadata, which can result in data loss if the namenode garbage collects blocks that it thinks are no longer used.
+<br>
+<br>How about we maintain a checksum as part of the image and edit log, check those on startup, and refuse to start up if they are different. Or at least provide a configuration option to do so if people are worried about the overhead of maintaining checksums of these files. Even if we assume dfs.name.dir is reliable storage, this guards against operator errors.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-900">HDFS-900</a>.
+     Blocker bug reported by tlipcon and fixed by shv <br>
+     <b>Corrupt replicas are not tracked correctly through block report from DN</b><br>
+     <blockquote>This one is tough to describe, but essentially the following order of events is seen to occur:
+<br>
+<br># A client marks one replica of a block to be corrupt by telling the NN about it
+<br># Replication is then scheduled to make a new replica of this node
+<br># The replication completes, such that there are now 3 good replicas and 1 corrupt replica
+<br># The DN holding the corrupt replica sends a block report. Rather than telling this DN to delete the corrupt replica, the NN instead marks it as a new *good* replica of the block, and schedules deletion on one of the good replicas.
+<br>
+<br>I don&apos;t know if this is a dataloss bug in the case of 1 corrupt replica with dfs.replication=2, but it seems feasible. I will attach a debug log with some commentary marked by &apos;============&gt;&apos;, plus a unit test patch which I can get to reproduce this behavior reliably. (it&apos;s not a proper unit test, just some edits to an existing one to show it)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-895">HDFS-895</a>.
+     Major improvement reported by dhruba and fixed by tlipcon (hdfs client)<br>
+     <b>Allow hflush/sync to occur in parallel with new writes to the file</b><br>
+     <blockquote>In the current trunk, the HDFS client methods writeChunk() and hflush/sync are synchronized. This means that if an hflush/sync is in progress, an application cannot write data to the HDFS client buffer. This reduces the write throughput of the transaction log in HBase. 
+<br>
+<br>The hflush/sync should allow new writes to happen to the HDFS client even when an hflush/sync is in progress. It can record the seqno of the message for which it should receive the ack, indicate to the DataStream thread to start flushing those messages, exit the synchronized section and just wait for that ack to arrive.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-884">HDFS-884</a>.
+     Minor improvement reported by stevel@apache.org and fixed by stevel@apache.org (data-node)<br>
+     <b>DataNode makeInstance should report the directory list when failing to start up</b><br>
+     <blockquote>When {{Datanode.makeInstance()}} cannot work with one of the directories in dfs.data.dir, it logs this at warn level (while losing the stack trace). 
+<br>
+<br>It should include the nested exception for better troubleshooting. Then, when all dirs in the list fail, an exception is thrown, but this exception does not include the list of directories. It should list the absolute path of every missing/failing directory, so that whoever sees the exception can see where to start looking for problems: either the filesystem or the configuration. 
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-882">HDFS-882</a>.
+     Minor improvement reported by stevel@apache.org and fixed by stevel@apache.org (data-node)<br>
+     <b>Datanode could log what hostname and ports it is listening on at startup</b><br>
+     <blockquote>The Datanode logs the port it is listening on, but if you are having problems with multi-NIC systems or IPv6 grief, knowing the hostname is handy too. Also, it doesn&apos;t log the SSL port info.
+<br>
+<br>Proposed: provide more details at the debug level</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-881">HDFS-881</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon <br>
+     <b>Refactor DataNode Packet header into DataTransferProtocol</b><br>
+     <blockquote>The Packet Header format is used ad-hoc in various places. This JIRA is to refactor it into a class inside DataTransferProtocol (like was done with PipelineAck)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-874">HDFS-874</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (hdfs client, test)<br>
+     <b>TestHDFSFileContextMainOperations fails on weirdly configured DNS hosts</b><br>
+     <blockquote>On an internal build machine I see exceptions like this:
+<br>java.lang.IllegalArgumentException: Wrong FS: hdfs://localhost:47262/data/1/scratch/patchqueue/patch-worker-20518/patch_21/svnrepo/build/test/data/test/test/testRenameWithQuota/srcdir, expected: hdfs://localhost.localdomain:47262
+<br>
+<br>&quot;hostname&quot; and &quot;hostname -f&quot; both show the machine&apos;s FQDN (not localhost). /etc/hosts is stock after CentOS 5 install. &quot;host 127.0.0.1&quot; reverses to &quot;localhost&quot;</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-853">HDFS-853</a>.
+     Major improvement reported by dhruba and fixed by dms (name-node)<br>
+     <b>The HDFS webUI should show a metric that summarizes whether the cluster is balanced regarding disk space usage</b><br>
+     <blockquote>It is desirable to know how much the datanodes vary from one another in terms of space utilization to get a sense of how well an HDFS cluster is balanced.
+<br>
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-829">HDFS-829</a>.
+     Major bug reported by aw and fixed by aw <br>
+     <b>hdfsJniHelper.c: #include &lt;error.h&gt; is not portable</b><br>
+     <blockquote>hdfsJniHelper.c includes &lt;error.h&gt; but this appears to be unnecessary, since even under Linux none of the routines that are prototyped are used.  Worse yet, error.h doesn&apos;t appear to be a standard header file so this breaks on Mac OS X and Solaris and prevents libhdfs from being built.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-811">HDFS-811</a>.
+     Minor new feature reported by raviphulari and fixed by eli (test)<br>
+     <b>Add metrics, failure reporting and additional tests for HDFS-457</b><br>
+     <blockquote> HDFS-457 introduced an improvement which allows a datanode to continue if a volume for replica storage fails. Previously a datanode shut down if any volume failed. 
+<br>
+<br>I suggest the following additional tests for this improvement. 
+<br>
+<br>#1 Test successive  volume failures ( Minimum 4 volumes )
+<br>#2 Test if each volume failure reports reduction in available DFS space and remaining space.
+<br>#3 Test if failure of all volumes on a data nodes leads to the data node failure.
+<br>#4 Test if correcting failed storage disk brings updates and increments available DFS space. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-752">HDFS-752</a>.
+     Major new feature reported by sureshms and fixed by sureshms <br>
+     <b>Add interface classification stable &amp; scope to HDFS</b><br>
+     <blockquote>This jira addresses adding interface classification for the classes in hadoop hdfs, based on the mechanism described in Hadoop-5073.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-727">HDFS-727</a>.
+     Blocker bug reported by eli and fixed by eli (libhdfs)<br>
+     <b>bug setting block size hdfsOpenFile </b><br>
+     <blockquote>In hdfsOpenFile in libhdfs invokeMethod needs to cast the block size argument to a jlong so a full 8 bytes are passed (rather than 4 plus some garbage which causes writes to fail due to a bogus block size). 
+<br>
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-718">HDFS-718</a>.
+     Minor improvement reported by andrewr and fixed by andrewr (name-node)<br>
+     <b>configuration parameter to prevent accidental formatting of HDFS filesystem</b><br>
+     <blockquote>Currently, any time the NameNode is not running, an HDFS filesystem will accept the &apos;format&apos; command, and will duly format itself. There are those of us who have multi-PB HDFS filesystems who are really quite uncomfortable with this behavior. There is &quot;Y/N&quot; confirmation in the format command, but if the formatter genuinely believes themselves to be doing the right thing, the filesystem will be formatted.
+<br>
+<br>This patch adds a configuration parameter to the namenode, dfs.namenode.support.allowformat, which defaults to &quot;true,&quot; the current behavior: always allow formatting if the NameNode is down or some other process is not holding the namenode lock. But if dfs.namenode.support.allowformat is set to &quot;false,&quot; the NameNode will not allow itself to be formatted until this config parameter is changed to &quot;true&quot;.
+<br>
+<br>The general idea is that for production HDFS filesystems, the user would format the HDFS once, then set dfs.namenode.support.allowformat to &quot;false&quot; for all time.
+<br>
+<br>The attached patch was generated against trunk and +1&apos;s on my test machine. We have a 0.20 version that we are using in our cluster as well.</blockquote></li>
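+
+<blockquote>For example, once a production filesystem has been formatted, an operator could set the property named in the description above in hdfs-site.xml (illustrative only):
+<br>&lt;property&gt;
+<br>  &lt;name&gt;dfs.namenode.support.allowformat&lt;/name&gt;
+<br>  &lt;value&gt;false&lt;/value&gt;
+<br>&lt;/property&gt;
+</blockquote>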
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-712">HDFS-712</a>.
+     Major task reported by eli and fixed by eli (libhdfs)<br>
+     <b>Move libhdfs from mr to hdfs </b><br>
+     <blockquote>Here&apos;s an hdfs jira for MAPREDUCE-665. During the project split libhdfs was put in the mapreduce repo instead of hdfs, lets move it to hdfs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-708">HDFS-708</a>.
+     Major new feature reported by shv and fixed by harlowja (test, tools)<br>
+     <b>A stress-test tool for HDFS.</b><br>
+     <blockquote>It would be good to have a tool for automatic stress testing HDFS, which would provide IO-intensive load on HDFS cluster.
+<br>The idea is to start the tool, let it run overnight, and then be able to analyze possible failures.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-697">HDFS-697</a>.
+     Major test reported by eli and fixed by eli <br>
+     <b>Enable asserts for tests by default</b><br>
+     <blockquote>See HADOOP-6309. Let&apos;s make the tests run with java asserts by default.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-696">HDFS-696</a>.
+     Major test reported by eli and fixed by eli (test)<br>
+     <b>Java assertion failures triggered by tests</b><br>
+     <blockquote>Re-purposing as catch-all ticket for assertion failures when running tests with java asserts enabled. Running with the attached patch on trunk@823732 the following tests all trigger assertion failures:
+<br> 
+<br>TestAccessTokenWithDFS
+<br>TestInterDatanodeProtocol
+<br>TestBackupNode 
+<br>TestBlockUnderConstruction
+<br>TestCheckpoint  
+<br>TestNameEditsConfigs
+<br>TestStartup
+<br>TestStorageRestore</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-671">HDFS-671</a>.
+     Blocker bug reported by jnp and fixed by tomwhite <br>
+     <b>Documentation change for updated configuration keys.</b><br>
+     <blockquote> HDFS-531, HADOOP-6233 and HDFS-631 have resulted in changes in several config keys. The hadoop documentation needs to be updated to reflect those changes.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-613">HDFS-613</a>.
+     Major bug reported by shv and fixed by tlipcon (test)<br>
+     <b>TestBalancer and TestBlockTokenWithDFS fail Balancer assert</b><br>
+     <blockquote>Running TestBalancer with asserts on. The assert in {{Balancer.chooseNode()}} is triggered and the test fails. We do not see it in the builds because asserts are off there. So either the assert is irrelevant or there is another bug in the Balancer code.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-599">HDFS-599</a>.
+     Major improvement reported by dhruba and fixed by dms (name-node)<br>
+     <b>Improve Namenode robustness by prioritizing datanode heartbeats over client requests</b><br>
+     <blockquote>The namenode processes RPC requests from clients that are reading/writing to files as well as heartbeats/block reports from datanodes.
+<br>
+<br>Sometimes, because of various reasons (Java GC runs, inconsistent performance of the NFS filer that stores HDFS transaction logs, etc), the namenode encounters transient slowness. For example, if the device that stores the HDFS transaction logs becomes sluggish, the Namenode&apos;s ability to process RPCs slows down to a certain extent. During this time, the RPCs from clients as well as the RPCs from datanodes suffer in similar fashion. If the underlying problem becomes worse, the NN&apos;s ability to process a heartbeat from a DN is severely impacted, thus causing the NN to declare that the DN is dead. Then the NN starts replicating blocks that used to reside on the now-declared-dead datanode. This adds extra load to the NN. Then the now-declared-dead datanode finally re-establishes contact with the NN, and sends a block report. The block report processing on the NN is another heavyweight activity, thus adding more load to the already overloaded namenode. 
+<br>
+<br>My proposal is that the NN should try its best to continue processing RPCs from datanodes and give lesser priority to serving client requests. The Datanode RPCs are integral to the consistency and performance of the Hadoop file system, and it is better to protect them at all costs. This will ensure that the NN recovers from the hiccup much faster than it does now.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-556">HDFS-556</a>.
+     Major improvement reported by jghoman and fixed by eli (name-node)<br>
+     <b>Provide info on failed volumes in the web ui</b><br>
+     <blockquote>HDFS-457 provided better handling of failed volumes but did not provide a corresponding view of this functionality on the web ui, such as a view of which datanodes have failed volumes.  This would be a good feature to have.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-528">HDFS-528</a>.
+     Major new feature reported by tlipcon and fixed by tlipcon (scripts)<br>
+     <b>Add ability for safemode to wait for a minimum number of live datanodes</b><br>
+     <blockquote>When starting up a fresh cluster programmatically, users often want to wait until DFS is &quot;writable&quot; before continuing in a script. &quot;dfsadmin -safemode wait&quot; doesn&apos;t quite work for this on a completely fresh cluster, since when there are 0 blocks on the system, 100% of them are accounted for before any DNs have reported.
+<br>
+<br>This JIRA is to add a command which waits until a certain number of DNs have reported as alive to the NN.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-455">HDFS-455</a>.
+     Minor improvement reported by pirroh and fixed by pirroh (data-node, name-node)<br>
+     <b>Make NN and DN handle comma-separated configuration strings in an intuitive way</b><br>
+     <blockquote>The following configuration causes problems:
+<br>&lt;property&gt;
+<br>&lt;name&gt;dfs.data.dir&lt;/name&gt;
+<br>&lt;value&gt;/mnt/hstore2/hdfs, /home/foo/dfs&lt;/value&gt; 
+<br>&lt;/property&gt;
+<br>
+<br>The problem is that the space after the comma causes the second storage directory to be &quot; /home/foo/dfs&quot;, which is a directory named &lt;SPACE&gt; containing a sub-dir named &quot;home&quot; under the Hadoop datanode&apos;s default directory. This will typically cause the user&apos;s home partition to fill, but will be very hard for the user to diagnose, since a directory with a whitespace name is easy to overlook.
+<br>
+<br>(ripped from HADOOP-2366)</blockquote></li>
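+
+<blockquote>A minimal sketch of the intuitive behaviour (illustrative only, not the committed patch; conf is an assumed Configuration instance): trim whitespace around each comma-separated entry before treating it as a directory.
+<br>    String raw = conf.get(&quot;dfs.data.dir&quot;);    // e.g. &quot;/mnt/hstore2/hdfs, /home/foo/dfs&quot;
+<br>    String[] dirs = raw.split(&quot;,&quot;);
+<br>    for (int i = 0; i &lt; dirs.length; i++) {
+<br>      dirs[i] = dirs[i].trim();                  // &quot; /home/foo/dfs&quot; becomes &quot;/home/foo/dfs&quot;
+<br>    }
+</blockquote>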
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-330">HDFS-330</a>.
+     Trivial improvement reported by aw and fixed by aw (data-node)<br>
+     <b>Datanode Web UIs should provide robots.txt</b><br>
+     <blockquote>There is a potential issue that someone might have an internal corporate crawler that goes through HDFS browser accidentally.  It might be a good idea to provide a default robots file that disables crawling. [No, this didn&apos;t happen to us. :) ]</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-259">HDFS-259</a>.
+     Major sub-task reported by tlipcon and fixed by tlipcon <br>
+     <b>Remove intentionally corrupt 0.13 directory layout creation</b><br>
+     <blockquote>Given that 0.13 is incredibly old at this point, I think the likelihood of anyone trying to start a 0.20+ namenode on a 0.13 directory layout is essentially nil. The intentionally-corrupt &quot;${dfs.name.dir}/image/&quot; directory just serves to confuse new users at this point, so I propose removing it.
+<br>
+<br>If no one objects, I&apos;ll submit a patch. If there are objections, I propose at least adding a README explaining its purpose (same text as in the corrupt fsimage file)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-202">HDFS-202</a>.
+     Major new feature reported by acmurthy and fixed by hairong (hdfs client, name-node)<br>
+     <b>Add a bulk FileSystem.getFileBlockLocations</b><br>
+     <blockquote>Currently map-reduce applications (specifically file-based input-formats) use FileSystem.getFileBlockLocations to compute splits. However they are forced to call it once per file.
+<br>The downsides are multiple:
+<br>   # Even with a few thousand files to process the number of RPCs quickly starts getting noticeable
+<br>   # The current implementation of getFileBlockLocations is too slow since each call results in &apos;search&apos; in the namesystem. Assuming a few thousand input files it results in that many RPCs and &apos;searches&apos;.
+<br>
+<br>It would be nice to have a FileSystem.getFileBlockLocations which can take in a directory, and return the block-locations for all files in that directory. We could eliminate both the per-file RPC and also the &apos;search&apos; by a &apos;scan&apos;.
+<br>
+<br>When I tested this for terasort, a moderate job with 8000 input files, the runtime halved from the current 8s to 4s. Clearly this is much more important for latency-sensitive applications...</blockquote></li>
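+
+<blockquote>A minimal sketch of how a client could consume such a bulk call (illustrative only; it assumes the bulk listing is exposed as FileSystem#listFiles returning LocatedFileStatus entries that already carry block locations, and that fs and inputDir are an initialized FileSystem and an input Path):
+<br>    RemoteIterator&lt;LocatedFileStatus&gt; it = fs.listFiles(inputDir, false);
+<br>    while (it.hasNext()) {
+<br>      LocatedFileStatus stat = it.next();
+<br>      BlockLocation[] locs = stat.getBlockLocations();   // no extra RPC per file
+<br>      // ... compute splits from locs ...
+<br>    }
+</blockquote>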
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-96">HDFS-96</a>.
+     Major bug reported by dhruba and fixed by pkling <br>
+     <b>HDFS does not support blocks greater than 2GB</b><br>
+     <blockquote>HDFS currently does not support blocks greater than 2GB in size.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3438">MAPREDUCE-3438</a>.
+     Major bug reported by shv and fixed by rvadali (contrib/raid)<br>
+     <b>TestRaidNode fails because of &quot;Too many open files&quot;</b><br>
+     <blockquote>TestRaidNode fails because it opens many connections.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2328">MAPREDUCE-2328</a>.
+     Major bug reported by tlipcon and fixed by qwertymaniac <br>
+     <b>memory-related configurations missing from mapred-default.xml</b><br>
+     <blockquote>HADOOP-5881 added new configuration parameters for memory-based scheduling, but they weren&apos;t added to mapred-default.xml</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3429">MAPREDUCE-3429</a>.
+     Major bug reported by cos and fixed by cos (contrib/capacity-sched, contrib/gridmix)<br>
+     <b>Few contrib tests are failing because of the missing commons-lang dependency</b><br>
+     <blockquote>As a result of the MAPREDUCE-3311 fix, a transitive {{commons-lang}} dependency isn&apos;t available to contrib tests anymore. This causes a silent failure with a timeout. The problem is only seen if tests are run with {{-Dtest.output=yes}}</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3311">MAPREDUCE-3311</a>.
+     Major task reported by cos and fixed by cos (build)<br>
+     <b>Bump jetty to 6.1.26</b><br>
+     <blockquote>MapReduce part of HADOOP-7450</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3156">MAPREDUCE-3156</a>.
+     Major test reported by cos and fixed by cos (test)<br>
+     <b>Allow TestMRCLI to be run against a cluster</b><br>
+     <blockquote>Mapreduce part of HDFS-1762</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3151">MAPREDUCE-3151</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (contrib/vertica)<br>
+     <b>Contrib tests failing</b><br>
+     <blockquote>Jenkins builds fail:
+<br>https://builds.apache.org/view/G-L/view/Hadoop/job/Hadoop-Mapreduce-22-branch/80/console
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3139">MAPREDUCE-3139</a>.
+     Major bug reported by shv and fixed by jghoman (test)<br>
+     <b>SlivePartitioner generates negative partitions</b><br>
+     <blockquote>{{SlivePartitioner.getPartition()}} returns negative partition numbers on some occasions, which is illegal.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3138">MAPREDUCE-3138</a>.
+     Blocker bug reported by acmurthy and fixed by owen.omalley (client, mrv2)<br>
+     <b>Allow for applications to deal with MAPREDUCE-954</b><br>
+     <blockquote>MAPREDUCE-954 changed the context-objs api to interfaces. This breaks Pig. We need a bridge for them to move to 0.23.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3088">MAPREDUCE-3088</a>.
+     Major bug reported by shv and fixed by shv (build)<br>
+     <b>Clover 2.4.3 breaks build for 0.22 branch</b><br>
+     <blockquote>Due to a known bug in Clover 2.4.3, the build for the 0.22 branch is broken.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3039">MAPREDUCE-3039</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (contrib/capacity-sched, contrib/fair-share, contrib/gridmix, contrib/mrunit, contrib/mumak, contrib/raid, contrib/streaming, jobhistoryserver)<br>
+     <b>Make mapreduce use same version of avro as HBase</b><br>
+     <blockquote>HBase depends on avro 1.5.3 whereas hadoop-common depends on 1.3.2.
+<br>When building HBase on top of hadoop, this should be consistent.
+<br>Moreover, this should be consistent between common, hdfs, and mapreduce.
+<br>
+<br>Contribs seem to have declared a dependency on avro but are not in fact depending on it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3026">MAPREDUCE-3026</a>.
+     Major bug reported by mayank_bansal and fixed by mayank_bansal (jobtracker)<br>
+     <b>When user adds hierarchical queues to the cluster, mapred queue -list returns NULL Pointer Exception</b><br>
+     <blockquote>When a user adds hierarchical queues and tries to view them from the command line using 
+<br>mapred queue -list 
+<br>it returns a NullPointerException.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-3025">MAPREDUCE-3025</a>.
+     Blocker bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Contribs not building</b><br>
+     <blockquote>Contribs are not getting built.
+<br>Snippet from Jenkins:
+<br>
+<br>compile:
+<br>[subant] No sub-builds to iterate on
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2991">MAPREDUCE-2991</a>.
+     Major bug reported by priyomustafi and fixed by priyomustafi (scheduler)<br>
+     <b>queueinfo.jsp fails to show queue status if any Capacity scheduler queue name has a dash/hyphen in it.</b><br>
+     <blockquote>If any queue name has a dash/hyphen in it, queueinfo.jsp doesn&apos;t show any queue information.  This is happening because the queue name is used to create javascript variables and javascript doesn&apos;t allow dashes in variable names.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2948">MAPREDUCE-2948</a>.
+     Major bug reported by milindb and fixed by mahadev (contrib/streaming)<br>
+     <b>Hadoop streaming test failure, post MR-2767</b><br>
+     <blockquote>After removing LinuxTaskController in MAPREDUCE-2767, one of the tests in contrib/streaming, TestStreamingAsDifferentUser.java, is failing since it imports org.apache.hadoop.mapred.ClusterWithLinuxTaskController. Patch forthcoming.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2940">MAPREDUCE-2940</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Build fails with ant 1.7.0 but works with 1.8.0</b><br>
+     <blockquote>contrib builds fail when using Ant 1.7.
+<br>
+<br>build.xml calls build.xml in contrib, which calls block-forensics build, which in turn uses build-contrib.
+<br>The inheritAll=true overrides the basedir in ant 1.7.0 but not in 1.8.0.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2939">MAPREDUCE-2939</a>.
+     Major task reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Ant setup on hadoop7 jenkins host</b><br>
+     <blockquote>From the build error it looks like
+<br>a) ant is not set up on the machine
+<br>b) $ANT_HOME points to the wrong spot
+<br>
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2779">MAPREDUCE-2779</a>.
+     Major bug reported by mingma and fixed by mingma (job submission)<br>
+     <b>JobSplitWriter.java can&apos;t handle large job.split file</b><br>
+     <blockquote>We use Cascading&apos;s MultiInputFormat. MultiInputFormat sometimes generates a big job.split file (used internally by Hadoop); sometimes it can go beyond 2GB.
+<br>In JobSplitWriter.java, the function that generates such a file uses a 32-bit signed integer to compute the offset into job.split.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2767">MAPREDUCE-2767</a>.
+     Blocker bug reported by milindb and fixed by milindb (security)<br>
+     <b>Remove Linux task-controller from 0.22 branch</b><br>
+     <blockquote>There&apos;s a potential security hole in the task-controller as it stands. Based on the discussion on general@, removing task-controller from the 0.22 branch will pave way for 0.22.0 release. (This was done for the 0.21.0 release as well: see MAPREDUCE-2014.) We can roll a 0.22.1 release with the task-controller when it is fixed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2753">MAPREDUCE-2753</a>.
+     Major bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Generated POMs hardcode dependency on hadoop-common version 0.22.0-SNAPSHOT</b><br>
+     <blockquote>The generated poms inject the version of mapred itself, but hardcode the version of hadoop-common they depend on.
+<br>When trying to build downstream projects (HBase), then they will require hadoop-common-0.22.0-SNAPSHOT.jar instead of the version they compiled against.
+<br>
+<br>When trying to do an offline build this will fail to resolve as another hadoop-common has been installed in the local maven repo.
+<br>Even during online build, it should compile against the hadoop-common that hdfs compiled against.
+<br>
+<br>When versions mismatch one cannot do a coherent build. That is particularly problematic when making simultaneous change in hadoop-common and hadoop-mapreduce and you want to try this locally before committing each.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2752">MAPREDUCE-2752</a>.
+     Minor bug reported by jrottinghuis and fixed by jrottinghuis (build)<br>
+     <b>Build does not pass along properties to contrib builds</b><br>
+     <blockquote>The subant call that compiles contribs does not pass along parameters from the parent build.
+<br>Properties such as hadoop-common.version, asfrepo, offline, etc. are not passed along.
+<br>The result is that a build without an Internet connection fails, and hdfsproxy refuses to build against its own recently built common but rather downloads 0.22-SNAPSHOT from Apache again.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2571">MAPREDUCE-2571</a>.
+     Blocker bug reported by sinofool and fixed by sinofool <br>
+     <b>CombineFileInputFormat.getSplits throws a java.lang.ArrayStoreException</b><br>
+     <blockquote>The getSplits method of 
+<br>  org.apache.hadoop.mapred.lib.CombineFileInputFormat 
+<br>does not work.
+<br>
+<br>...mapred.lib.CombineFileInputFormat(0.20-style) is a proxy for ...mapreduce.lib.input.CombineFileInputFormat(0.21-style)
+<br>
+<br>The 0.21-style getSplits returns ArrayList&lt;...mapreduce.lib.input.CombineFileSplit&gt;
+<br>and the 0.20-style delegation calls toArray(...mapred.InputSplit[])
+<br>
+<br>The ...mapreduce.lib.input.CombineFileSplit is based on ...mapreduce.InputSplit
+<br>and ...mapred.InputSplit is an interface, not a super-class of ...mapreduce.InputSplit
+<br>
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2531">MAPREDUCE-2531</a>.
+     Blocker bug reported by revans2 and fixed by revans2 (client)<br>
+     <b>org.apache.hadoop.mapred.jobcontrol.getAssignedJobID throw class cast exception </b><br>
+     <blockquote>When using a combination of the mapred and mapreduce APIs (PIG) it is possible to have the following exception
+<br>
+<br>Caused by: java.lang.ClassCastException: org.apache.hadoop.mapreduce.JobID cannot be cast to
+<br>org.apache.hadoop.mapred.JobID
+<br>        at org.apache.hadoop.mapred.jobcontrol.Job.getAssignedJobID(Job.java:71)
+<br>        at org.apache.pig.backend.hadoop.executionengine.mapReduceLayer.MapReduceLauncher.launchPig(MapReduceLauncher.java:239)
+<br>        at org.apache.pig.PigServer.launchPlan(PigServer.java:1325)
+<br>        ... 29 more
+<br>
+<br>This is because the JobID is just downcast.  It should be calling JobID.downgrade</blockquote></li>
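+
+<blockquote>A minimal sketch of the suggested fix (illustrative only; the accessor that yields the new-API id is an assumption, not the committed patch):
+<br>    org.apache.hadoop.mapreduce.JobID newApiId = controlledJob.getJobID();   // assumed accessor
+<br>    // JobID.downgrade converts the new-API id into the old-API type; a plain cast throws ClassCastException
+<br>    org.apache.hadoop.mapred.JobID oldApiId = org.apache.hadoop.mapred.JobID.downgrade(newApiId);
+</blockquote>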
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2516">MAPREDUCE-2516</a>.
+     Minor bug reported by asrabkin and fixed by asrabkin <br>
+     <b>option to control sensitive web actions</b><br>
+     <blockquote>as per HADOOP-7302, webinterface.private.actions should not be in trunk. But it should be here, and should have a clearer name.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2515">MAPREDUCE-2515</a>.
+     Major bug reported by asrabkin and fixed by asrabkin (jobtracker)<br>
+     <b>MapReduce references obsolete options</b><br>
+     <blockquote>Option topology.node.switch.mapping.impl has been renamed to net.topology.node.switch.mapping.impl; JT still uses old name. Likewise, JT uses old names for several other since-renamed options.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2505">MAPREDUCE-2505</a>.
+     Minor improvement reported by matei and fixed by matei (contrib/fair-share, documentation)<br>
+     <b>Explain how to use ACLs in the fair scheduler</b><br>
+     <blockquote>The fair scheduler already works with the ACL system introduced through the mapred.queue.* parameters, but the documentation doesn&apos;t explain how to use this. We should add a paragraph or two about it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2502">MAPREDUCE-2502</a>.
+     Trivial improvement reported by eli and fixed by eli (job submission)<br>
+     <b>JobSubmitter should use mapreduce.job.maps</b><br>
+     <blockquote>JobSubmitter should use {{mapreduce.job.maps}} instead of the deprecated {{mapred.map.tasks}}.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2487">MAPREDUCE-2487</a>.
+     Minor bug reported by forvines and fixed by devaraj.k <br>
+     <b>ChainReducer uses MAPPER_BY_VALUE instead of REDUCER_BY_VALUE</b><br>
+     <blockquote>On line 293 of o.a.h.mapred.lib.Chain in setReducer(...):
+<br>
+<br>reducerConf.setBoolean(MAPPER_BY_VALUE, byValue);
+<br>
+<br>this should be REDUCER_BY_VALUE.
+<br>
+<br>http://grepcode.com/file/repository.cloudera.com/content/repositories/releases/com.cloudera.hadoop/hadoop-core/0.20.2-737/org/apache/hadoop/mapred/lib/Chain.java#293</blockquote></li>
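+
+<blockquote>The corrected line would read (illustrative):
+<br>    reducerConf.setBoolean(REDUCER_BY_VALUE, byValue);
+</blockquote>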
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2486">MAPREDUCE-2486</a>.
+     Blocker bug reported by dvryaboy and fixed by tlipcon <br>
+     <b>0.22 - snapshot incorrect dependency published in .pom files</b><br>
+     <blockquote>The pom at https://repository.apache.org/content/repositories/snapshots/org/apache/hadoop/hadoop-mapred/0.22.0-SNAPSHOT/ publishes a dependency on hadoop-common version &quot;0.22.0-dev-SNAPSHOT&quot; while hadoop-common only publishes &quot;0.22.0-SNAPSHOT&quot; (no -dev).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2472">MAPREDUCE-2472</a>.
+     Major bug reported by tlipcon and fixed by atm (task-controller)<br>
+     <b>Extra whitespace in mapred.child.java.opts breaks JVM initialization</b><br>
+     <blockquote>When creating taskjvm.sh, we split mapred.child.java.opts on &quot; &quot; and then create a quoted argument for each of those results. So, if you have an extra space anywhere in this configuration, you get an argument &apos;&apos; in the child command line, which the JVM interprets as an empty class name. This results in a ClassNotFoundException and the task cannot run.</blockquote></li>
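+
+<blockquote>A minimal sketch of a defensive way to tokenize the opts string (illustrative only, not the committed patch; conf is an assumed Configuration instance):
+<br>    String opts = conf.get(&quot;mapred.child.java.opts&quot;, &quot;&quot;);
+<br>    List&lt;String&gt; args = new ArrayList&lt;String&gt;();
+<br>    for (String tok : opts.split(&quot;\\s+&quot;)) {
+<br>      if (!tok.isEmpty()) {    // skip the empty tokens produced by leading or doubled spaces
+<br>        args.add(tok);
+<br>      }
+<br>    }
+</blockquote>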
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2457">MAPREDUCE-2457</a>.
+     Critical bug reported by tucu00 and fixed by tucu00 (jobtracker)<br>
+     <b>job submission should inject group.name (on the JT side)</b><br>
+     <blockquote>Until Hadoop 0.20, the JobClient was injecting the property &apos;group.name&apos; on the JobConf submitted to the JobTracker.
+<br>Since Hadoop 0.21, due to security related changes, this is not done anymore.
+<br>This breaks backwards compatibility for jobs/components that expect the &apos;group.name&apos; to be automatically set at submission time.
+<br>An example of a component affected by this change is the FairScheduler, where it is common to use group.name as the pool name. Unlike other properties, a special characteristic of group.name is that its value cannot be tampered with by a user.
+<br>For security reasons this should not be done (as it was done before) in the JobClient side. Instead, it should be done in the JobTracker when the JobConf is received.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2448">MAPREDUCE-2448</a>.
+     Minor bug reported by szetszwo and fixed by eli (contrib/raid, test)<br>
+     <b>NoSuchMethodError: org.apache.hadoop.hdfs.TestDatanodeBlockScanner.corruptReplica(..)</b><br>
+     <blockquote>
+java.lang.NoSuchMethodError: org.apache.hadoop.hdfs.TestDatanodeBlockScanner.corruptReplica(Ljava/lang/String;I)Z
+<br>  at org.apache.hadoop.raid.TestBlockFixer.corruptBlock(TestBlockFixer.java:643)
+<br>  at org.apache.hadoop.raid.TestBlockFixer.implBlockFix(TestBlockFixer.java:189)
+<br>  at org.apache.hadoop.raid.TestBlockFixer.testBlockFixLocal(TestBlockFixer.java:139)
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2445">MAPREDUCE-2445</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (security, test)<br>
+     <b>TestMiniMRWithDFSWithDistinctUsers is very broken</b><br>
+     <blockquote>This test has a number of issues:
+<br>- it side steps the normal job submission API for no apparent reason, manually writing splits file and uploading submission files. (but forgets to upload the job jar, so the jobs all fail)
+<br>- it doesn&apos;t call waitForCompletion, or check job status (so it doesn&apos;t notice that the jobs all fail)
+<br>- it doesn&apos;t verify in any way that the job output is owned by the user who supposedly ran the job
+<br>- it shuts down DFS before MR
+<br>
+<br>These all conspire to make it pass, but it isn&apos;t actually testing anything.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2437">MAPREDUCE-2437</a>.
+     Blocker bug reported by shv and fixed by shv (test)<br>
+     <b>SLive should process only part* files while generating the report.</b><br>
+     <blockquote>SliveTest when producing the final report scans all files in the reduce output directory. The directory now may contain {{_SUCCESS}} and {{_logs}} entries. SliveTest should process only files starting with {{part*}}.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2428">MAPREDUCE-2428</a>.
+     Blocker bug reported by tomwhite and fixed by tomwhite <br>
+     <b>start-mapred.sh script fails if HADOOP_HOME is not set</b><br>
+     <blockquote>MapReduce portion of HADOOP-6953</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2410">MAPREDUCE-2410</a>.
+     Minor improvement reported by dieter_be and fixed by qwertymaniac (contrib/streaming, documentation)<br>
+     <b>document multiple keys per reducer oddity in hadoop streaming FAQ</b><br>
+     <blockquote>Hi,
+<br>for a newcomer to hadoop streaming, it comes as a surprise that the reducer receives arbitrary keys, unlike the &quot;real&quot; hadoop where a reducer works on a single key.
+<br>An explanation for this is @ http://mail-archives.apache.org/mod_mbox/hadoop-common-user/201103.mbox/browser
+<br>
+<br>I suggest to add this to the FAQ of hadoop streaming</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2394">MAPREDUCE-2394</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon <br>
+     <b>JUnit output format doesn&apos;t propagate into some contrib builds</b><br>
+     <blockquote>Some of the contribs seem to have an issue where the test.junit.output.format property isn&apos;t propagating down into their builds. So, Hudson is unable to parse the test output, and we see failed builds with no actual parsed test results showing what failed.
+<br>
+<br>This is at least true for {{contrib/raid}} but maybe others as well.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2392">MAPREDUCE-2392</a>.
+     Major bug reported by tomwhite and fixed by tomwhite <br>
+     <b>TaskTracker shutdown in the tests sometimes take 60s</b><br>
+     <blockquote>There are a lot of the following in the test logs:
+<br>
+<br>2011-03-16 13:47:02,267 INFO  mapred.TaskTracker (TaskTracker.java:shutdown(1275)) - Shutting down StatusHttpServer
+<br>2011-03-16 13:48:02,349 ERROR mapred.TaskTracker (TaskTracker.java:offerService(1609)) - Caught exception: java.io.IOException: Call to localhost/127.0.0.1:57512 failed on local exception: java.nio.channels.ClosedByInterruptException
+<br>
+<br>Note there is over one minute between the first line and the second.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2383">MAPREDUCE-2383</a>.
+     Major task reported by tlipcon and fixed by qwertymaniac (distributed-cache, documentation)<br>
+     <b>Improve documentation of DistributedCache methods</b><br>
+     <blockquote>Users find the various methods in DistributedCache confusing - it&apos;s not clearly documented what the difference is between addArchiveToClassPath vs addFileToClassPath. We should improve the docs to clarify this and perhaps add an example that uses the DistributedCache.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2372">MAPREDUCE-2372</a>.
+     Major improvement reported by tlipcon and fixed by tlipcon (task)<br>
+     <b>TaskLogAppender mechanism shouldn&apos;t be set in log4j.properties</b><br>
+     <blockquote>The TaskLogAppender log4j appender relies on using log4j.properties to pass in some Java system properties into properties of the logger. This is problematic since we&apos;ve often found that users have customized log4j.properties and don&apos;t upgrade it when they upgrade the version of Hadoop.
+<br>
+<br>Since this is really an internal mechanism of how the task runner passes task info to the TLA, we shouldn&apos;t rely on these settings in log4j.properties at all. Rather, we should just get the system properties directly from System.getProperty.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2337">MAPREDUCE-2337</a>.
+     Major improvement reported by tomwhite and fixed by tomwhite <br>
+     <b>Remove dependence of public MapReduce API on classes in server package</b><br>
+     <blockquote>Cluster#getJobTrackerState() returns a org.apache.hadoop.mapreduce.server.jobtracker.State enum, which makes the API in o.a.h.mapreduce have a dependency on the server package. It would be better to make the public API self-contained by using an equivalent enum in the Cluster class.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2336">MAPREDUCE-2336</a>.
+     Major bug reported by tomwhite and fixed by tomwhite (documentation)<br>
+     <b>Tool-related packages should be in the Tool javadoc group</b><br>
+     <blockquote>Some of the tool packages are mistakenly in the general group.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2327">MAPREDUCE-2327</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon <br>
+     <b>MapTask doesn&apos;t need to put username information in SpillRecord</b><br>
+     <blockquote>This is an amendment to MAPREDUCE-2096 that&apos;s found in Yahoo&apos;s 0.20.100 branch.
+<br>
+<br>This bug causes task failures in the following case:
+<br>- Cluster is not set up with LinuxTaskController (ie not secured cluster)
+<br>- Job submitter is not the same as the user running the TT
+<br>- Map output is more than one spill&apos;s worth
+<br>
+<br>The issue is that UserGroupInformation&apos;s view of the current user is the job submitter, but on disk the spill files will be owned by the TT user. SecureIO will then fail when constructing the spill record.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2315">MAPREDUCE-2315</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon <br>
+     <b>javadoc is failing in nightly</b><br>
+     <blockquote>Last nightly build failed to publish javadoc because the javadoc build failed:
+<br>
+<br>javadoc:
+<br>    [mkdir] Created dir: /grid/0/hudson/hudson-slave/workspace/Hadoop-Mapreduce-22-branch/trunk/build/docs/api
+<br>  [javadoc] Generating Javadoc
+<br>  [javadoc] Javadoc execution
+<br>  [javadoc] 1 error
+<br>  [javadoc] javadoc: error - Cannot find doclet class org.apache.hadoop.classification.tools.ExcludePrivateAnnotationsStandardDoclet</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2314">MAPREDUCE-2314</a>.
+     Major improvement reported by rvs and fixed by rvs (build)<br>
+     <b>configure files that are generated as part of the released tarball need to have executable bit set</b><br>
+     <blockquote>Currently the configure files that are packaged in a tarball are -rw-rw-r--
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2311">MAPREDUCE-2311</a>.
+     Blocker bug reported by tlipcon and fixed by schen (contrib/fair-share)<br>
+     <b>TestFairScheduler failing on trunk</b><br>
+     <blockquote>Most of the test cases in this test are failing on trunk, unclear how long since the contrib tests weren&apos;t running while the core tests were failed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2304">MAPREDUCE-2304</a>.
+     Minor bug reported by priyomustafi and fixed by priyomustafi (test)<br>
+     <b>TestMRCLI fails when hostname has a hyphen (-)</b><br>
+     <blockquote>TestMRCLI fails with below
+<br>
+<br>Comparator: [RegexpComparator]
+<br>Comparision result:   [fail]
+<br>Expected output: [mv: Wrong FS: har:/dest/dir0.har/dir0/file0, expected: hdfs://\w+[.a-z]*:[0-9]+]
+<br>Actual output:   [mv: Wrong FS: har:/dest/dir0.har/dir0/file0, expected: hdfs://lab-something.host.com:34039
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2285">MAPREDUCE-2285</a>.
+     Blocker bug reported by rvadali and fixed by tlipcon (test)<br>
+     <b>MiniMRCluster does not start after ant test-patch</b><br>
+     <blockquote>Any test using MiniMRCluster hangs in the MiniMRCluster constructor after running ant test-patch. Steps to reproduce:
+<br> 1. ant -Dpatch.file=&lt;dummy patch to CHANGES.txt&gt;  -Dforrest.home=&lt;path to forrest&gt; -Dfindbugs.home=&lt;path to findbugs&gt; -Dscratch.dir=/tmp/testpatch  -Djava5.home=&lt;path to java5&gt; test-patch
+<br> 2. Run any test that creates MiniMRCluster, say ant test -Dtestcase=TestFileArgs (contrib/streaming)
+<br>
+<br>Expected result: Test should succeed
+<br>Actual result: Test hangs  in MiniMRCluster.&lt;init&gt;. This does not happen if we run ant clean after ant test-patch
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2284">MAPREDUCE-2284</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (test)<br>
+     <b>TestLocalRunner.testMultiMaps times out</b><br>
+     <blockquote>This test has timed out in a number of Hudson builds.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2283">MAPREDUCE-2283</a>.
+     Blocker bug reported by nidaley and fixed by rvadali (contrib/raid)<br>
+     <b>TestBlockFixer hangs initializing MiniMRCluster</b><br>
+     <blockquote>TestBlockFixer (a raid contrib test) is hanging the precommit testing on Hudson</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2282">MAPREDUCE-2282</a>.
+     Blocker bug reported by tomwhite and fixed by shv (test)<br>
+     <b>MapReduce tests don&apos;t compile following HDFS-1561</b><br>
+     <blockquote>TestMRServerPorts depends on TestHDFSServerPorts which was changed by HDFS-1561, resulting in a compilation failure.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2281">MAPREDUCE-2281</a>.
+     Major bug reported by pocheung and fixed by pocheung <br>
+     <b>Fix javac, javadoc, findbugs warnings</b><br>
+     <blockquote>Split from HADOOP-6642</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2277">MAPREDUCE-2277</a>.
+     Minor bug reported by tlipcon and fixed by tlipcon (contrib/capacity-sched)<br>
+     <b>TestCapacitySchedulerWithJobTracker fails sometimes</b><br>
+     <blockquote>Sometimes the testJobTrackerIntegration test fails on my Hudson. It seems the issue is that it doesn&apos;t ever wait for the first job to complete before checking its success status. Since the two jobs are in different queues, the first job may complete after the second job.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2272">MAPREDUCE-2272</a>.
+     Trivial bug reported by tlipcon and fixed by qwertymaniac (tasktracker)<br>
+     <b>Job ACL file should not be executable</b><br>
+     <blockquote>For some reason the job ACL file is localized with permissions 700. This doesn&apos;t make sense, since it&apos;s not executable. It should be 600.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2260">MAPREDUCE-2260</a>.
+     Major improvement reported by rvs and fixed by rvs (build)<br>
+     <b>Remove auto-generated native build files</b><br>
+     <blockquote>The repo currently includes the automake and autoconf generated files for the native build. Per discussion on HADOOP-6421 let&apos;s remove them and use the host&apos;s automake and autoconf. We should also do this for libhdfs and fuse-dfs. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2256">MAPREDUCE-2256</a>.
+     Major bug reported by priyomustafi and fixed by priyomustafi (contrib/fair-share)<br>
+     <b>FairScheduler fairshare preemption from multiple pools may preempt all tasks from one pool causing that pool to go below fairshare.</b><br>
+     <blockquote>Scenarios:
+<br>You have a cluster with 600 map slots and 3 pools.  The fair share for each pool is 200 to start with.  The fair-share preemption timeout is 5 mins.
+<br>1)  Pool1 schedules 300 map tasks first
+<br>2)  Pool2 then schedules another 300 map tasks
+<br>3)  Pool3 demands 300 map tasks but doesn&apos;t get any slot as all slots are taken.
+<br>4)  After 5 mins pool3 should preempt 200 map-slots.  Instead of preempting 100 slots each from pool1 and pool2, the bug would cause it to preempt all 200 slots from pool2 (last started), causing it to go below its fair share.  This is happening because the preemptTask method is not reducing the tasks left from a pool while preempting the tasks.  
+<br>
+<br>The above scenario could be an extreme case but some amount of excess preemption would happen because of this bug.
+<br>
+<br>The patch I created was for 0.22.0, but the code fix should work on 0.21 as well, as it looks like it has the same bug.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2253">MAPREDUCE-2253</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon <br>
+     <b>Servlets should specify content type</b><br>
+     <blockquote>HADOOP-7093 will change the default content-type to text/plain. So TaskLogServlet, which outputs HTML, needs to change to specify this content type. I believe the other HTML servlets already correctly specify a content type. The MapOutputServlet appears to specify no content type and work fine without one, but to be &quot;correct&quot; we may as well specify application/octet-stream</blockquote></li>
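+
+<blockquote>A minimal sketch of the fix pattern (illustrative only, not the committed patch): a servlet that emits HTML should declare its content type before writing.
+<br>    public void doGet(HttpServletRequest request, HttpServletResponse response)
+<br>        throws ServletException, IOException {
+<br>      // declare the content type explicitly rather than relying on a container default
+<br>      response.setContentType(&quot;text/html; charset=utf-8&quot;);
+<br>      PrintWriter out = response.getWriter();
+<br>      // ... write the HTML body ...
+<br>    }
+</blockquote>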
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2251">MAPREDUCE-2251</a>.
+     Major bug reported by tlipcon and fixed by qwertymaniac <br>
+     <b>Remove mapreduce.job.userhistorylocation config</b><br>
+     <blockquote>Best I can tell, this config parameter is no longer used as of MAPREDUCE-157 but still exists in the code and in mapred-default.xml. We should remove it to avoid user confusion.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2241">MAPREDUCE-2241</a>.
+     Trivial test reported by tlipcon and fixed by tlipcon (task-controller, test)<br>
+     <b>ClusterWithLinuxTaskController should accept relative path on the command line</b><br>
+     <blockquote>Currently if you pass a relative path for the -Dtaskcontroller-path option when running these tests, it fails in a fairly unintuitive way. We should absolutize it inside the tests to make it easier for people to run them.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2238">MAPREDUCE-2238</a>.
+     Critical bug reported by eli and fixed by tlipcon (build, test)<br>
+     <b>Undeletable build directories </b><br>
+     <blockquote>The MR hudson job is failing, looks like it&apos;s due to a test chmod&apos;ing a build directory so the checkout can&apos;t clean the build dir.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2234">MAPREDUCE-2234</a>.
+     Major sub-task reported by tlipcon and fixed by tlipcon (tasktracker)<br>
+     <b>If Localizer can&apos;t create task log directory, it should fail on the spot</b><br>
+     <blockquote>Currently, it simply emits a warning. Then, when the taskjvm.sh tries to pipe its output into this directory, it fails with a strange error code like &quot;exit code: 1&quot; which is not intuitive to ops. Instead it should simply throw an exception at initialization time rather than attempting to run the task.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2224">MAPREDUCE-2224</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (tasktracker)<br>
+     <b>Synchronization bugs in JvmManager</b><br>
+     <blockquote>JvmManager.JvmManagerForType has several HashMap members that are inconsistently synchronized. I&apos;ve seen sporadic NPEs in the 0.20 version of this code which has similar bugs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2222">MAPREDUCE-2222</a>.
+     Major bug reported by vicaya and fixed by vicaya <br>
+     <b>Ivy resolve force mode should be turned off by default</b><br>
+     <blockquote>cf. HADOOP-7068</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2219">MAPREDUCE-2219</a>.
+     Major bug reported by tlipcon and fixed by tlipcon (jobtracker)<br>
+     <b>JT should not try to remove mapred.system.dir during startup</b><br>
+     <blockquote>During startup, the JT tries to clean up mapred.system.dir by recursively removing it and then recreating it. This requires that mapred.system.dir is inside a directory owned by the mapred user. For example, if set to /system/mapred then /system must be owned by the mapred account. This isn&apos;t documented properly and also seems unnecessary. Instead we can remove the *contents* of mapred.system.dir instead of the directory itself.</blockquote></li>
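+
+<blockquote>A minimal sketch of the &quot;remove the contents, not the directory&quot; approach (illustrative only, not the committed patch; fs and systemDir are an assumed FileSystem and Path):
+<br>    FileStatus[] contents = fs.listStatus(systemDir);
+<br>    if (contents != null) {
+<br>      for (FileStatus entry : contents) {
+<br>        fs.delete(entry.getPath(), true);   // remove each child, keep systemDir itself
+<br>      }
+<br>    }
+</blockquote>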
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2200">MAPREDUCE-2200</a>.
+     Major bug reported by cos and fixed by cos (test)<br>
+     <b>TestUmbilicalProtocolWithJobToken is failing without Krb evironment: needs to be conditional</b><br>
+     <blockquote>TestUmbilicalProtocolWithJobToken requires Krb environment to be set. For testing some &apos;pseudo&apos; environment is needed (similar to HDFS-1284). </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2195">MAPREDUCE-2195</a>.
+     Major bug reported by cos and fixed by cos (test)<br>
+     <b>New property for local conf directory in system-test-mapreduce.xml file.</b><br>
+     <blockquote>As with its counterpart HDFS-1167, a new parameter needs to be added to the system-test configuration file to support the &apos;cluster restart with new configuration&apos; feature.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2188">MAPREDUCE-2188</a>.
+     Major bug reported by owen.omalley and fixed by owen.omalley <br>
+     <b>The new API MultithreadedMapper doesn&apos;t call the initialize method of the RecordReader</b><br>
+     <blockquote>The wrapping RecordReader in the Multithreaded Mapper is never initialized. With HADOOP-6685, this becomes a problem because the ReflectionUtils.copy requires a non-null configuration.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2184">MAPREDUCE-2184</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>Port DistRaid.java to new mapreduce API</b><br>
+     <blockquote>DistRaid.java was implemented with the older mapred API; this task is for porting it to the new API.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2180">MAPREDUCE-2180</a>.
+     Minor test reported by tlipcon and fixed by tlipcon (contrib/fair-share)<br>
+     <b>Add coverage of fair scheduler servlet to system test</b><br>
+     <blockquote>MAPREDUCE-2051 added a system test for the fair scheduler which starts a minicluster and runs a couple jobs with preemption on. I recently found a deadlock in a previous version of the scheduler that was due to lock inversion between the scheduler servlet and some JT internals. I&apos;d like to modify the existing system test to also hit the /scheduler servlet, allowing jcarder to detect such lock inversions in the future.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2179">MAPREDUCE-2179</a>.
+     Blocker bug reported by gkesavan and fixed by rvadali (contrib/raid)<br>
+     <b>RaidBlockSender.java compilation fails</b><br>
+     <blockquote>
+Mapreduce trunk compilation is broken
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2173">MAPREDUCE-2173</a>.
+     Major bug reported by pkling and fixed by pkling <br>
+     <b>Race condition in TestBlockFixer causes intermittent failure</b><br>
+     <blockquote>TestBlockFixer sometimes fails in reportCorruptBlocks because a corrupt block is deleted before in.readFully is called. This causes a BlockMissingException instead of the expected ChecksumException.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2169">MAPREDUCE-2169</a>.
+     Major task reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>Integrated Reed-Solomon code with RaidNode</b><br>
+     <blockquote>Scott Chen recently checked in an implementation of the Reed-Solomon code. This task will track the integration of the code with RaidNode.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2167">MAPREDUCE-2167</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>Faster directory traversal for raid node</b><br>
+     <blockquote>The RaidNode currently iterates over the directory structure to figure out which files to RAID. With millions of files, this can take a long time - especially if some files are already RAIDed and the RaidNode needs to look at parity files / parity file HARs to determine if the file needs to be RAIDed.
+<br>
+<br>The directory traversal is encapsulated inside the class DirectoryTraversal, which examines one file at a time, using the caller&apos;s thread.
+<br>
+<br>My proposal is to make this multi-threaded as follows:
+<br> * use a pool of threads inside DirectoryTraversal
+<br> * The caller&apos;s thread is used to retrieve directories, and each new directory is assigned to a thread in the pool. The worker thread examines all the files in the directory.
+<br> * If there are sub-directories, those are added back as work items to the pool.
+<br>
+<br>Comments?</blockquote></li>
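+
+<p>A minimal sketch of the proposed shape described in MAPREDUCE-2167 above (class and method names are made up, and it uses java.io.File instead of HDFS just to show the pool-based traversal): the caller submits a directory, a worker lists it, files are examined in the worker thread, and sub-directories go back into the pool.</p>
+<pre>
+import java.io.File;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+import java.util.concurrent.atomic.AtomicInteger;
+
+public class ParallelTraversalSketch {
+  private final ExecutorService pool = Executors.newFixedThreadPool(4);
+  private final AtomicInteger pending = new AtomicInteger();   // directories still being processed
+
+  void submitDir(final File dir) {
+    pending.incrementAndGet();
+    pool.execute(new Runnable() {
+      public void run() {
+        try {
+          File[] entries = dir.listFiles();
+          if (entries != null) {
+            for (File f : entries) {
+              if (f.isDirectory()) {
+                submitDir(f);            // sub-directories go back into the pool as work items
+              } else {
+                System.out.println(f);   // "examine" a file; real code would decide whether to raid it
+              }
+            }
+          }
+        } finally {
+          synchronized (pending) {
+            if (pending.decrementAndGet() == 0) pending.notifyAll();
+          }
+        }
+      }
+    });
+  }
+
+  public static void main(String[] args) throws InterruptedException {
+    ParallelTraversalSketch t = new ParallelTraversalSketch();
+    t.submitDir(new File(args.length &gt; 0 ? args[0] : "."));
+    synchronized (t.pending) {
+      while (t.pending.get() &gt; 0) t.pending.wait();   // wait until all submitted directories are done
+    }
+    t.pool.shutdown();
+  }
+}
+</pre>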
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2150">MAPREDUCE-2150</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>RaidNode should periodically fix corrupt blocks</b><br>
+     <blockquote>(Recreating HDFS-1171 since RAID is in mapreduce)
+<br>
+<br>RaidNode currently does not fix missing blocks. The missing blocks have to be fixed using RaidShell.
+<br>This task proposes that recovery be more automated:
+<br>1. RaidNode periodically fetches a list of corrupt files from the NameNode
+<br>2. If the corrupt files can be fixed using RAID, it should generate the block.
+<br>3. Choose a datanode and send the block contents along with checksum to the datanode.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2147">MAPREDUCE-2147</a>.
+     Trivial improvement reported by qwertymaniac and fixed by qwertymaniac (jobtracker)<br>
+     <b>JobInProgress has some redundant lines in its ctor</b><br>
+     <blockquote>In the ctor of the JobInProgress class that&apos;s used by the JT, lines that create the various lists of TIPs are repeated for no purpose. Might have been due to an oversight, I think.
+<br>
+<br>Attaching a patch that removes these unnecessary repeats of re-init.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2146">MAPREDUCE-2146</a>.
+     Minor bug reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>Raid should not affect access time of a source file</b><br>
+     <blockquote>After a file is read for creating a raid parity file, the access time should be set back to the value before the read. The read by RAID code is not an application read and should not affect the access time.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2145">MAPREDUCE-2145</a>.
+     Major improvement reported by gkesavan and fixed by gkesavan <br>
+     <b>upgrade clover on the build servers to v 3.0.2</b><br>
+     <blockquote>Upgrade clover on the build servers to v 3.0.2, as the MR builds require the latest version of clover for better coverage reporting.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2143">MAPREDUCE-2143</a>.
+     Major bug reported by rvadali and fixed by rvadali (harchive)<br>
+     <b>HarFileSystem is not able to handle spaces in its path</b><br>
+     <blockquote>If the Path to the HAR contains spaces, Path.getFileSystem() fails. The problem is in HarFileSystem.initialize(), which uses URI.toString() to get a string for getting to the .har suffix. URI.toString() returns a percent-encoded string when the path contains spaces. When this string is subsequently used to get the _index file, we get a FileNotFoundException. The fix is to use URI.getPath().
+<br></blockquote></li>
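+
+<p>For illustration only (a minimal, self-contained sketch, not the actual HarFileSystem.initialize() code): java.net.URI keeps percent-encoding in toString() but decodes it in getPath(), which is why a HAR path containing spaces only resolves correctly via getPath().</p>
+<pre>
+import java.net.URI;
+
+public class UriSpaceDemo {
+  public static void main(String[] args) {
+    // A HAR path containing a space, percent-encoded as a URI.
+    URI uri = URI.create("har:///user/foo/my%20archive.har/_index");
+
+    // toString() keeps the encoded form, so a lookup built from it misses the real file name.
+    System.out.println(uri.toString());  // har:///user/foo/my%20archive.har/_index
+
+    // getPath() returns the decoded path, i.e. the actual name with a space.
+    System.out.println(uri.getPath());   // /user/foo/my archive.har/_index
+  }
+}
+</pre>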
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2142">MAPREDUCE-2142</a>.
+     Major task reported by pkling and fixed by pkling <br>
+     <b>Refactor RaidNode to remove dependence on map reduce</b><br>
+     <blockquote>I am refactoring the RaidNode code as follows: The base class RaidNode will contain the common functionality needed for raiding files. The derived class LocalRaidNode contains an implementation of RaidNode that performs raiding locally. The derived class DistRaidNode performs raiding using map reduce jobs. This way, only DistRaidNode has a dependency on map reduce code and RaidNode and LocalRaidNode can be moved to HDFS.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2141">MAPREDUCE-2141</a>.
+     Minor improvement reported by matei and fixed by matei <br>
+     <b>Add an &quot;extra data&quot; field to Task for use by Mesos</b><br>
+     <blockquote>In order to support running Hadoop on the Mesos cluster manager (http://mesos.berkeley.edu/), I&apos;d like to add an extra String field to the Task class to allow extra data (a Mesos task ID) to be associated with each task. This should have no impact on normal operation other than making the serialized form of Task a few bytes longer. In the Mesos support patch for Hadoop, this field is set by a pluggable Hadoop scheduler implementation to allow code on the TaskTracker side to see which Mesos task corresponds to each Hadoop task. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2132">MAPREDUCE-2132</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>Need a command line option in RaidShell to fix blocks using raid</b><br>
+     <blockquote>RaidShell currently has an option to recover a file and return the path to the recovered file. The administrator can then rename the recovered file to the damaged file.
+<br>
+<br>The problem with this is that the file metadata is altered, specifically the modification time. Instead we need a way to just repair the damaged blocks and send the fixed blocks to a data node.
+<br>
+<br>Once this is done, we can put automation around it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2127">MAPREDUCE-2127</a>.
+     Major bug reported by gkesavan and fixed by bmahe (build, pipes)<br>
+     <b>mapreduce trunk builds are failing on hudson</b><br>
+     <blockquote>https://hudson.apache.org/hudson/job/Hadoop-Mapreduce-trunk-Commit/507/console
+<br>
+<br>[exec] checking for pthread.h... yes
+<br>     [exec] checking for pthread_create in -lpthread... yes
+<br>     [exec] checking for HMAC_Init in -lssl... no
+<br>     [exec] configure: error: Cannot find libssl.so
+<br>     [exec] /grid/0/hudson/hudson-slave/workspace/Hadoop-Mapreduce-trunk-Commit/trunk/src/c++/pipes/configure: line 4250: exit: please: numeric argument required
+<br>     [exec] /grid/0/hudson/hudson-slave/workspace/Hadoop-Mapreduce-trunk-Commit/trunk/src/c++/pipes/configure: line 4250: exit: please: numeric argument required
+<br>
+<br>BUILD FAILED
+<br>/grid/0/hudson/hudson-slave/workspace/Hadoop-Mapreduce-trunk-Commit/trunk/build.xml:1647: exec returned: 255
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2126">MAPREDUCE-2126</a>.
+     Minor improvement reported by yaojingguo and fixed by yaojingguo (jobtracker)<br>
+     <b>JobQueueJobInProgressListener&apos;s javadoc is inconsistent with source code</b><br>
+     <blockquote>JobQueueJobInProgressListener.java has {@link #JobQueueJobInProgressListener(Collection)} in Javadoc. But it does not have the corresponding constructor. It has constructor JobQueueJobInProgressListener(Map&lt;JobSchedulingInfo, JobInProgress&gt; jobQueue). So {@link JobQueueJobInProgressListener(Collection)} should be {@link #JobQueueJobInProgressListener(Map)}.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2103">MAPREDUCE-2103</a>.
+     Trivial improvement reported by tlipcon and fixed by tlipcon (task-controller)<br>
+     <b>task-controller shouldn&apos;t require o-r permissions</b><br>
+     <blockquote>The task-controller currently checks that &quot;other&quot; users don&apos;t have read permissions. This is unnecessary - we just need to make sure it&apos;s not executable. The Debian policy manual explains it well:
+<br>Setuid and setgid executables should be mode 4755 or 2755 respectively, and owned by the appropriate user or group. They should not be made unreadable (modes like 4711 or 2711 or even 4111); doing so achieves no extra security, because anyone can find the binary in the freely available Debian package; it is merely inconvenient. For the same reason you should not restrict read or execute permissions on non-set-id executables.
+<br>Some setuid programs need to be restricted to particular sets of users, using file permissions. In this case they should be owned by the uid to which they are set-id, and by the group which should be allowed to execute them. They should have mode 4754; again there is no point in making them unreadable to those users who must not be allowed to execute them.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2099">MAPREDUCE-2099</a>.
+     Major bug reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>RaidNode should recreate outdated parity HARs</b><br>
+     <blockquote>After parity files are archived into a parity HAR, a change in the source file does not cause the HAR to be recreated. Instead, individual parity files are created for the modified files but the HAR is not touched. This causes increased disk usage for parity data.
+<br>
+<br>The parity HAR could be recreated if a certain percentage of files in the HAR are determined to be outdated.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2096">MAPREDUCE-2096</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon (jobtracker, security, tasktracker)<br>
+     <b>Secure local filesystem IO from symlink vulnerabilities</b><br>
+     <blockquote>This JIRA is to contribute a patch developed on the private security@ mailing list.
+<br>
+<br>The vulnerability is that MR daemons occasionally open files that are located in a path where the user has write access. A malicious user may place a symlink in place of the expected file in order to cause the daemon to instead read another file on the system -- one which the attacker may not naturally be able to access. This includes delegation tokens belonging to other users, log files, keytabs, etc.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2095">MAPREDUCE-2095</a>.
+     Major bug reported by vinaythota and fixed by ranjit (contrib/gridmix)<br>
+     <b>Gridmix unable to run for compressed traces (.gz format).</b><br>
+     <blockquote>I was trying to run gridmix with a compressed trace file. However, it throws a JsonParseException and exits.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2093">MAPREDUCE-2093</a>.
+     Major improvement reported by cos and fixed by cos (test)<br>
+     <b>Herriot JT and TT clients should vend statistics</b><br>
+     <blockquote>Mapreduce counterpart of HDFS-1408</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2084">MAPREDUCE-2084</a>.
+     Blocker bug reported by tomwhite and fixed by tomwhite (documentation)<br>
+     <b>Deprecated org.apache.hadoop.util package in MapReduce produces deprecations in Common classes in Eclipse</b><br>
+     <blockquote>As reported in [this thread|http://mail-archives.apache.org/mod_mbox/hadoop-mapreduce-user/201009.mbox/%3C4C9A0A08.3030901@web.de%3E] the classes in org.apache.hadoop.util from the Common JAR, like Tool, are marked as deprecated by Eclipse, even though they are not deprecated. The fix is to mark the individual classes in the MapReduce org.apache.hadoop.util package as deprecated, not the whole package.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2082">MAPREDUCE-2082</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>Race condition in writing the jobtoken password file when launching pipes jobs</b><br>
+     <blockquote>In Application.java, when the jobtoken password file is written, there is a race condition because the file is written in the job&apos;s work directory. The file should rather be written in the task&apos;s working directory.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2078">MAPREDUCE-2078</a>.
+     Major bug reported by vinaythota and fixed by amar_kamat (tools/rumen)<br>
+     <b>TraceBuilder unable to generate the traces while giving the job history path by globbing.</b><br>
+     <blockquote>I was trying to generate the traces for MR job histories by using TraceBuilder. However, it&apos;s unable to generate the traces when the job history path is given by globbing. It throws a file-not-found exception even though the job history path exists.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2077">MAPREDUCE-2077</a>.
+     Major bug reported by vicaya and fixed by vicaya <br>
+     <b>Name clash in the deprecated o.a.h.util.MemoryCalculatorPlugin</b><br>
+     <blockquote>Name clash compile error in the deprecated org.apache.hadoop.util.MemoryCalculatorPlugin due to JLS3 8.4.8.3 (cf. http://bugs.sun.com/view_bug.do?bug_id=6182950)
+<br>
+<br>The bug doesn&apos;t manifest in JDK 1.6 up to update 20, but shows up in NetBeans 6.9+ due to its bundled (conforming) compiler. The fix is trivial: just remove the offending method in the deprecated subclass, as its equivalent erasure is inherited from the parent class anyway.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2073">MAPREDUCE-2073</a>.
+     Trivial test reported by tlipcon and fixed by tlipcon (distributed-cache, test)<br>
+     <b>TestTrackerDistributedCacheManager should be up-front about requirements on build environment</b><br>
+     <blockquote>TestTrackerDistributedCacheManager will fail on a system where the build directory is in any path where an ancestor doesn&apos;t have a+x permissions. On one of our hudson boxes, for example, hudson&apos;s workspace had 700 permissions and caused this test to fail reliably, but not in an obvious manner. It would be helpful if the test failed with a more obvious error message during setUp() when the build environment is misconfigured.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2067">MAPREDUCE-2067</a>.
+     Major bug reported by atm and fixed by atm (security)<br>
+     <b>Distinct minicluster services (e.g. NN and JT) overwrite each other&apos;s service policies</b><br>
+     <blockquote>MR portion of HADOOP-6951.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2059">MAPREDUCE-2059</a>.
+     Major bug reported by dadkins and fixed by subrotosanyal (jobtracker)<br>
+     <b>RecoveryManager attempts to add jobtracker.info</b><br>
+     <blockquote>The jobtracker is treating the file &apos;jobtracker.info&apos; in the system data directory as a job to be recovered
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2054">MAPREDUCE-2054</a>.
+     Major bug reported by sandholm and fixed by sandholm (contrib/dynamic-scheduler)<br>
+     <b>Hierarchical queue implementation broke dynamic queue addition in Dynamic Scheduler</b><br>
+     <blockquote>Queue names were returned from the queue manager as an immutable set after the hierarchical queue name feature, which breaks the dynamic priority scheduler.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2051">MAPREDUCE-2051</a>.
+     Major test reported by tlipcon and fixed by tlipcon (contrib/fair-share)<br>
+     <b>Contribute a fair scheduler preemption system test</b><br>
+     <blockquote>We&apos;ve seen a number of bugs in the fair share scheduler not caught by its unit tests, which are heavily mock-based. This JIRA is to add an integration/system/stress test for the fairshare scheduler. This test can help identify races and deadlocks, and when run within the jcarder framework has identified several potential deadlocks for us that aren&apos;t turned up running small scale testing.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2046">MAPREDUCE-2046</a>.
+     Major improvement reported by namit and fixed by dhruba <br>
+     <b>A CombineFileInputSplit cannot be less than a dfs block </b><br>
+     <blockquote>I ran into this while testing some hive features.
+<br>
+<br>Whether we use hiveinputformat or combinehiveinputformat, a split cannot be less than a dfs block size.
+<br>This is a problem if we want to increase the block size for older data to reduce memory consumption for the
+<br>name node.
+<br>
+<br>It would be useful if the input split was independent of the dfs block size.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2034">MAPREDUCE-2034</a>.
+     Trivial test reported by tlipcon and fixed by tlipcon (test)<br>
+     <b>TestSubmitJob triggers NPE instead of permissions error</b><br>
+     <blockquote>TestSubmitJob.testSecureJobExecution catches _any_ IOException and assumes a permissions error has been caught. In one case it was in fact passing an invalid path name to the NameNode and triggering an NPE rather than a permission-denied error, but the test was not specific enough to detect this.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2031">MAPREDUCE-2031</a>.
+     Major bug reported by amareshwari and fixed by ravidotg (tasktracker, test)<br>
+     <b>TestTaskLauncher and TestTaskTrackerLocalization fail with NPE in trunk.</b><br>
+     <blockquote>TestTaskLauncher and TestTaskTrackerLocalization fail in trunk after the commit of MAPREDUCE-1881 with NPE:
+<br>NPE happens because taskTracker.myInstrumentation is not initialized.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2029">MAPREDUCE-2029</a>.
+     Major bug reported by pauly and fixed by rvadali (contrib/raid)<br>
+     <b>DistributedRaidFileSystem not removed from cache on close()</b><br>
+     <blockquote>When DistributedRaidFileSystem.close() is called, it does not remove itself from the FileSystem cache, but it does close the underlying filesystem, e.g. DFS.
+<br>
+<br>Because the DRFS with the closed DFS is still in the cache, calling FileSystem.get() returns a stale DRFS that throws &apos;filesystem closed&apos; exceptions.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2026">MAPREDUCE-2026</a>.
+     Major improvement reported by schen and fixed by jsensarma <br>
+     <b>JobTracker.getJobCounters() should not hold JobTracker lock while calling JobInProgress.getCounters()</b><br>
+     <blockquote>JobTracker.getJobCounter() will lock JobTracker and call JobInProgress.getCounters().
+<br>JobInProgress.getCounters() can be very expensive because it aggregates all the task counters.
+<br>We found from the JobTracker jstacks that this method is one of the bottlenecks of JobTracker performance.
+<br>
+<br>JobInProgress.getCounters() should be able to be called outside the JobTracker lock because it already takes the JobInProgress lock.
+<br>For example, it is used by jobdetails.jsp without a JobTracker lock.
+<br></blockquote></li>
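+
+<p>A generic sketch of the locking pattern argued for in MAPREDUCE-2026 above (hypothetical classes, not the JobTracker code): hold the coarse lock only long enough to look up the job, and run the expensive aggregation under the job&apos;s own lock.</p>
+<pre>
+import java.util.HashMap;
+import java.util.Map;
+
+public class LockScopeDemo {
+  // Hypothetical job with its own lock and an expensive, self-synchronized method.
+  static class Job {
+    synchronized long aggregateCounters() {
+      long sum = 0;
+      for (int i = 0; i &lt; 1000000; i++) sum += i;   // stands in for aggregating task counters
+      return sum;
+    }
+  }
+
+  private final Object trackerLock = new Object();
+  private final Map&lt;String, Job&gt; jobs = new HashMap&lt;String, Job&gt;();
+
+  long getJobCounters(String jobId) {
+    Job job;
+    synchronized (trackerLock) {       // coarse lock held only for the lookup
+      job = jobs.get(jobId);
+    }
+    if (job == null) return 0;
+    return job.aggregateCounters();    // expensive work happens outside the coarse lock
+  }
+
+  public static void main(String[] args) {
+    LockScopeDemo demo = new LockScopeDemo();
+    demo.jobs.put("job_1", new Job());
+    System.out.println(demo.getJobCounters("job_1"));
+  }
+}
+</pre>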
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2023">MAPREDUCE-2023</a>.
+     Major bug reported by hong.tang and fixed by hong.tang (benchmarks)<br>
+     <b>TestDFSIO read test may not read specified bytes.</b><br>
+     <blockquote>TestDFSIO&apos;s read test may read fewer bytes than specified when reading large files.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2022">MAPREDUCE-2022</a>.
+     Blocker bug reported by amareshwari and fixed by amareshwari (test)<br>
+     <b>trunk build broken</b><br>
+     <blockquote>Trunk compilation fails with following errors:
+<br>    [javac] /home/amarsri/workspace/trunk/src/test/mapred/org/apache/hadoop/mapred/TestSubmitJob.java:267: getListing(java.lang.String,byte[],boolean) in org.apache.hadoop.hdfs.protocol.ClientProtocol cannot be applied to (java.lang.String,byte[])
+<br>    [javac]         client.getListing(
+<br>    [javac]               ^
+<br>    [javac] /home/amarsri/workspace/trunk/src/test/mapred/org/apache/hadoop/mapred/TestSubmitJob.java:281: getListing(java.lang.String,byte[],boolean) in org.apache.hadoop.hdfs.protocol.ClientProtocol cannot be applied to (java.lang.String,byte[])
+<br>    [javac]         client.getListing(
+<br>    [javac]               ^
+<br>
+<br>This is due to the commit of HDFS-202.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2021">MAPREDUCE-2021</a>.
+     Major bug reported by amareshwari and fixed by amareshwari (client)<br>
+     <b>CombineFileInputFormat returns duplicate  hostnames in split locations</b><br>
+     <blockquote>CombineFileInputFormat.getSplits creates splits with duplicate locations. It adds the locations of the files in the split to an ArrayList; if all the files are on the same location, that location is added again and again. Instead, it should add them to a Set rather than a List to avoid duplicates.</blockquote></li>
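+
+<p>A minimal sketch of the idea in MAPREDUCE-2021 above (the helper name is made up; this is not the actual CombineFileInputFormat patch): collecting host names into a Set removes the duplicates before the split locations are built.</p>
+<pre>
+import java.util.Arrays;
+import java.util.LinkedHashSet;
+import java.util.Set;
+
+public class DedupeLocationsDemo {
+  // Hypothetical helper: drop duplicate host names while preserving order.
+  static String[] uniqueHosts(String[] rawHosts) {
+    Set&lt;String&gt; unique = new LinkedHashSet&lt;String&gt;(Arrays.asList(rawHosts));
+    return unique.toArray(new String[unique.size()]);
+  }
+
+  public static void main(String[] args) {
+    String[] hosts = { "node1", "node1", "node1", "node2" };
+    // Prints [node1, node2] instead of the duplicated list.
+    System.out.println(Arrays.toString(uniqueHosts(hosts)));
+  }
+}
+</pre>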
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2000">MAPREDUCE-2000</a>.
+     Major bug reported by hong.tang and fixed by hong.tang (tools/rumen)<br>
+     <b>Rumen is not able to extract counters for Job history logs from Hadoop 0.20</b><br>
+     <blockquote>Rumen tries to match the end of a value string through indexOf(&quot;\&quot;&quot;). It does not take into account the case of an escaped &apos;&quot;&apos; in the value string. This leads to incorrect parsing of the remaining key=value properties on the same line.</blockquote></li>
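+
+<p>A small sketch of the parsing issue in MAPREDUCE-2000 above (a hypothetical scanner, not the Rumen patch): the closing quote has to be found while skipping backslash-escaped quotes, rather than with a plain indexOf of the quote character.</p>
+<pre>
+public class QuoteScanDemo {
+  // Find the closing '"' of a value starting at "from", skipping \" escapes.
+  static int findClosingQuote(String line, int from) {
+    for (int i = from; i &lt; line.length(); i++) {
+      char c = line.charAt(i);
+      if (c == '\\') { i++; continue; }   // skip the escaped character
+      if (c == '"') return i;
+    }
+    return -1;
+  }
+
+  public static void main(String[] args) {
+    String line = "JOBNAME=\"my \\\"quoted\\\" job\" USER=\"bob\"";
+    int start = line.indexOf('"') + 1;
+    // line.indexOf('"', start) would stop at the escaped quote inside the value;
+    // the scan above finds the real closing quote instead.
+    System.out.println(line.substring(start, findClosingQuote(line, start)));
+  }
+}
+</pre>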
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1999">MAPREDUCE-1999</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>ClientProtocol incorrectly uses hdfs DelegationTokenSelector</b><br>
+     <blockquote>ClientProtocol in MR incorrectly uses the DelegationTokenSelector in hdfs due to a wrong import. It should use the DelegationTokenSelector in mapreduce.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1996">MAPREDUCE-1996</a>.
+     Trivial bug reported by glynnbach and fixed by qwertymaniac (documentation)<br>
+     <b>API: Reducer.reduce() method detail misstatement</b><br>
+     <blockquote>method detail for Reducer.reduce() method has paragraph starting:
+<br>
+<br>&quot;Applications can use the Reporter  provided to report progress or just indicate that they are alive. In scenarios where the application takes an insignificant amount of time to process individual key/value pairs, this is crucial since the framework might assume that the task has timed-out and kill that task. &quot;
+<br>
+<br>s/an insignificant amount of time/a significant amount of time/
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1993">MAPREDUCE-1993</a>.
+     Major bug reported by devaraj and fixed by devaraj <br>
+     <b>TestTrackerDistributedCacheManagerWithLinuxTaskController fails on trunk</b><br>
+     <blockquote>TestTrackerDistributedCacheManagerWithLinuxTaskController fails when run with the DefaultTaskController. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1992">MAPREDUCE-1992</a>.
+     Major bug reported by ravidotg and fixed by kzhang (jobtracker)<br>
+     <b>NPE in JobTracker&apos;s constructor</b><br>
+     <blockquote>On my local machine, JobTracker is *not* coming up with current trunk. Logs show the following NPE:
+<br>
+<br>2010-08-03 14:01:41,449 FATAL org.apache.hadoop.mapred.JobTracker: java.lang.NullPointerException
+<br>  at org.apache.hadoop.security.UserGroupInformation.isLoginKeytabBased(UserGroupInformation.java:703)
+<br>  at org.apache.hadoop.mapred.JobTracker.&lt;init&gt;(JobTracker.java:1383)
+<br>  at org.apache.hadoop.mapred.JobTracker.startTracker(JobTracker.java:275)
+<br>  at org.apache.hadoop.mapred.JobTracker.startTracker(JobTracker.java:267)
+<br>  at org.apache.hadoop.mapred.JobTracker.startTracker(JobTracker.java:262)
+<br>  at org.apache.hadoop.mapred.JobTracker.main(JobTracker.java:4236)
+<br>
+<br>2010-08-03 14:01:41,449 INFO org.apache.hadoop.mapred.JobTracker: SHUTDOWN_MSG:</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1989">MAPREDUCE-1989</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (contrib/gridmix)<br>
+     <b>Gridmix3 doesn&apos;t emit a proper message when the user resolver is set and no user list is given</b><br>
+     <blockquote>Currently, Gridmix3 emits the following message when the user resolver is set and no user list is given:
+<br>&quot;Resource null ignored&quot;.
+<br>This is not clear/meaningful to the user.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1982">MAPREDUCE-1982</a>.
+     Major bug reported by amar_kamat and fixed by ravidotg (tools/rumen)<br>
+     <b>[Rumen] TraceBuilder&apos;s output shows jobname as NULL for jobhistory files with valid jobnames</b><br>
+     <blockquote>{{TraceBuilder}} fails to extract configuration properties (like job-name) from the job-conf if the job-conf has the properties stored using the deprecated keys.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1979">MAPREDUCE-1979</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (contrib/gridmix)<br>
+     <b>&quot;Output directory already exists&quot; error in gridmix when gridmix.output.directory is not defined</b><br>
+     <blockquote>An &quot;Output directory already exists&quot; error is seen in gridmix when gridmix.output.directory is not defined. In that case, gridmix uses inputDir/gridmix/ as the output path for the gridmix run. Because gridmix creates outputPath (in this case, inputDir/gridmix/) at the beginning, the output path of the generate-data mapreduce job (i.e. inputDir) already exists and mapreduce reports an error.
+<br>
+<br>This outputPath needs to be created in any case (whether the user specifies the path using gridmix.output.directory OR gridmix itself uses inputDir/gridmix/), even though output paths of mapreduce jobs are created automatically (like mkdir -p), because gridmix needs to set 777 permissions on this outputPath so that different users can create the output directories of their mapreduce jobs within this gridmix run.
+<br>
+<br>The other case in which this problem is seen is when gridmix.output.directory is defined as a relative path, because gridmix then tries to create the relative path under ioPath/ and hits the same issue.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1975">MAPREDUCE-1975</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (contrib/gridmix)<br>
+     <b>gridmix shows unnecessary InterruptedException</b><br>
+     <blockquote>The following InterruptedException is seen when gridmix is run, even though the run completed successfully:
+<br>
+<br>10/06/24 20:43:03 INFO gridmix.ReplayJobFactory: START REPLAY @ 11331037109
+<br>10/06/24 20:43:03 ERROR gridmix.Statistics: Statistics interrupt while waiting for polling null
+<br>java.lang.InterruptedException
+<br>        at java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObjec\
+<br>t.reportInterruptAfterWait(AbstractQueuedSynchronizer.java:1899)
+<br>        at java.util.concurrent.locks.AbstractQueuedSynchronizer$ConditionObjec\
+<br>t.await(AbstractQueuedSynchronizer.java:2066)
+<br>        at org.apache.hadoop.mapred.gridmix.Statistics$StatCollector.run(Statis\
+<br>tics.java:190)
+<br>10/06/24 20:43:03 INFO gridmix.Gridmix: Exiting...</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1974">MAPREDUCE-1974</a>.
+     Major bug reported by schen and fixed by schen (contrib/fair-share)<br>
+     <b>FairScheduler can preempt the same task many times</b><br>
+     <blockquote>In FairScheduler.preemptTasks(), tasks are collected from JobInProgress.runningMapCache.
+<br>But tasks repeat multiple times in  JobInProgress.runningMapCache (on rack, node and cluster).
+<br>This makes FairScheduler preempt the same task many times.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1970">MAPREDUCE-1970</a>.
+     Major sub-task reported by schen and fixed by schen (contrib/raid)<br>
+     <b>Reed-Solomon code implementation to be used in raid</b><br>
+     <blockquote>A Reed-Solomon erasure code implementation.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1961">MAPREDUCE-1961</a>.
+     Major bug reported by hong.tang and fixed by hong.tang (contrib/gridmix)<br>
+     <b>[gridmix3] ConcurrentModificationException when shutting down Gridmix</b><br>
+     <blockquote>We observed the following exception occasionally at the end of the Gridmix run:
+<br>
+<br>{code}
+<br>Exception in thread &quot;StatsCollectorThread&quot; java.util.ConcurrentModificationException
+<br>          at java.util.AbstractList$Itr.checkForComodification(AbstractList.java:372)
+<br>          at java.util.AbstractList$Itr.next(AbstractList.java:343)
+<br>          at org.apache.hadoop.mapred.gridmix.Statistics$StatCollector.updateAndNotifyClusterStatsListeners(Statistics.java:220)
+<br>          at org.apache.hadoop.mapred.gridmix.Statistics$StatCollector.run(Statistics.java:205)
+<br>{code}</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1958">MAPREDUCE-1958</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>using delegation token over hftp for long running clients (part of hdfs 1296)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1945">MAPREDUCE-1945</a>.
+     Major improvement reported by kzhang and fixed by kzhang <br>
+     <b>Support for using different Kerberos keys for Jobtracker and TaskTrackers</b><br>
+     <blockquote>This is the MapRed part of HADOOP-6632.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1936">MAPREDUCE-1936</a>.
+     Major improvement reported by hong.tang and fixed by hong.tang (contrib/gridmix)<br>
+     <b>[gridmix3] Make Gridmix3 more customizable.</b><br>
+     <blockquote>I&apos;d like to make gridmix3 more customizable. Specifically, the proposed customizations include:
+<br>- add (random) location information for each sleep map task.
+<br>- make the parameters used in stress submission load throttling configurable.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1935">MAPREDUCE-1935</a>.
+     Major improvement reported by boryas and fixed by boryas <br>
+     <b>HFTP needs to be updated to use delegation tokens (from HDFS-1007)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1931">MAPREDUCE-1931</a>.
+     Major improvement reported by rksingh and fixed by ranjit (contrib/gridmix)<br>
+     <b>Gridmix forrest documentation </b><br>
+     <blockquote>Gridmix forrest documentation</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1925">MAPREDUCE-1925</a>.
+     Major bug reported by amareshwari and fixed by ravidotg (tools/rumen)<br>
+     <b>TestRumenJobTraces fails in trunk</b><br>
+     <blockquote>TestRumenJobTraces failed with following error:
+<br>Error Message
+<br>
+<br>the gold file contains more text at line 1 expected:&lt;56&gt; but was:&lt;0&gt;
+<br>
+<br>Stacktrace
+<br>
+<br>  at org.apache.hadoop.tools.rumen.TestRumenJobTraces.testHadoop20JHParser(TestRumenJobTraces.java:294)
+<br>
+<br>Full log of the failure is available at http://hudson.zones.apache.org/hudson/job/Mapreduce-Patch-h4.grid.sp2.yahoo.net/292/testReport/org.apache.hadoop.tools.rumen/TestRumenJobTraces/testHadoop20JHParser/</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1918">MAPREDUCE-1918</a>.
+     Major improvement reported by amar_kamat and fixed by amar_kamat (tools/rumen)<br>
+     <b>Add documentation to Rumen</b><br>
+     <blockquote>Add forrest documentation to Rumen tool.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1915">MAPREDUCE-1915</a>.
+     Trivial bug reported by rvernica and fixed by priyomustafi (tasktracker)<br>
+     <b>IndexCache - getIndexInformation - check reduce index Out Of Bounds</b><br>
+     <blockquote>When checking if the &quot;reduce&quot; index is out of bounds the check should be 
+<br>
+<br>info.mapSpillRecord.size() &lt;= reduce
+<br>
+<br>instead of:
+<br>
+<br>info.mapSpillRecord.size() &lt; reduce
+<br>
+<br>Not a big bug since an Out Of Bounds is thrown downstream anyway.</blockquote></li>
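+
+<p>The off-by-one in MAPREDUCE-1915 above in isolation (a sketch with made-up names, not the IndexCache code itself): with a zero-based reduce index, size == reduce is already out of range, so the check has to use &lt;=.</p>
+<pre>
+public class ReduceIndexCheckDemo {
+  // Corrected bounds check: reject reduce indexes of size or larger.
+  static void checkReduceIndex(int size, int reduce) {
+    if (size &lt;= reduce) {   // the old check (size &lt; reduce) let reduce == size through
+      throw new IndexOutOfBoundsException("reduce " + reduce + " &gt;= size " + size);
+    }
+  }
+
+  public static void main(String[] args) {
+    checkReduceIndex(4, 3);  // fine: last valid index
+    checkReduceIndex(4, 4);  // throws here; previously this slipped through
+  }
+}
+</pre>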
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1911">MAPREDUCE-1911</a>.
+     Major bug reported by amareshwari and fixed by amareshwari (contrib/streaming)<br>
+     <b>Fix errors in -info option in streaming</b><br>
+     <blockquote>Here are some of the findings by Karam while verifying -info option in streaming:
+<br># We need to add &quot;Optional&quot; for the -mapper, -reducer, -combiner and -file options.
+<br># For the -inputformat and -outputformat options, we should put &quot;Optional&quot; in the prefix for the sake of uniformity.
+<br># We need to remove the -cluster description.
+<br># -help option is not displayed in usage message.
+<br># when displaying message for -info or -help options, we should not display &quot;Streaming Job Failed!&quot;; also exit code should be 0 in case of -help/-info option.
+<br>
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1908">MAPREDUCE-1908</a>.
+     Major bug reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>DistributedRaidFileSystem does not handle ChecksumException correctly</b><br>
+     <blockquote>ChecksumException reports the offset of corruption within a block,
+<br>whereas DistributedRaidFileSystem.setAlternateLocations was expecting it
+<br>to report the offset of corruption within the file.
+<br>
+<br>The best way of dealing with a missing block/corrupt block is to just
+<br>use the current seek offset in the file as the position of corruption.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1900">MAPREDUCE-1900</a>.
+     Major bug reported by devaraj and fixed by kzhang (jobtracker, tasktracker)<br>
+     <b>MapReduce daemons should close FileSystems that are not needed anymore</b><br>
+     <blockquote>Related to HADOOP-6843, this jira is to make MapReduce behave better with respect to closing FileSystems when they are not needed anymore.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1894">MAPREDUCE-1894</a>.
+     Major bug reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>DistributedRaidFileSystem.readFully() does not return</b><br>
+     <blockquote>DistributedRaidFileSystem.readFully() has a while(true) loop with no return. The read(*) functions do not have this problem.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1893">MAPREDUCE-1893</a>.
+     Major improvement reported by shv and fixed by shv (benchmarks, test)<br>
+     <b>Multiple reducers for Slive</b><br>
+     <blockquote>Slive currently uses a single reducer. It could use multiple ones.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1892">MAPREDUCE-1892</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>RaidNode can allow layered policies more efficiently</b><br>
+     <blockquote>The RaidNode policy file can have layered policies that can cover a file more than once. To avoid processing a file multiple times (for RAIDing), RaidNode maintains a list of processed files that is used to avoid duplicate processing attempts.
+<br>
+<br>This is problematic in that a large number of processed files could cause the RaidNode to run out of memory.
+<br>
+<br>This task proposes a better method of detecting processed files. The method is based on the observation that a more selective policy will have a better match with a file name than a less selective one. Specifically, the more selective policy will have a longer common prefix with the file name.
+<br>
+<br>So to detect if a file has already been processed, the RaidNode only needs to maintain a list of processed policies and compare the lengths of the common prefixes. If the file has a longer common prefix with one of the processed policies than with the current policy, it can be assumed to be processed already.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1888">MAPREDUCE-1888</a>.
+     Major bug reported by amareshwari and fixed by ravidotg (contrib/streaming)<br>
+     <b>Streaming overrides user given output key and value types.</b><br>
+     <blockquote>The following code in StreamJob.java overrides user given output key and value types.
+<br>    idResolver.resolve(conf.get(StreamJobConfig.MAP_OUTPUT,
+<br>        IdentifierResolver.TEXT_ID));
+<br>    conf.setClass(StreamJobConfig.MAP_OUTPUT_READER_CLASS,
+<br>      idResolver.getOutputReaderClass(), OutputReader.class);
+<br>    job.setMapOutputKeyClass(idResolver.getOutputKeyClass());
+<br>    job.setMapOutputValueClass(idResolver.getOutputValueClass());
+<br>    
+<br>    idResolver.resolve(conf.get(StreamJobConfig.REDUCE_OUTPUT,
+<br>        IdentifierResolver.TEXT_ID));
+<br>    conf.setClass(StreamJobConfig.REDUCE_OUTPUT_READER_CLASS,
+<br>      idResolver.getOutputReaderClass(), OutputReader.class);
+<br>    job.setOutputKeyClass(idResolver.getOutputKeyClass());
+<br>    job.setOutputValueClass(idResolver.getOutputValueClass());
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1887">MAPREDUCE-1887</a>.
+     Major bug reported by kimballa and fixed by kimballa <br>
+     <b>MRAsyncDiskService does not properly absolutize volume root paths</b><br>
+     <blockquote>In MRAsyncDiskService, volume names are sometimes specified as relative paths, which are not converted to absolute paths. This can cause errors of the form &quot;cannot delete &lt;/full/path/to/foo&gt; since it is outside of &lt;relative/volume/root&gt;&quot; even though the actual path is inside the root. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1878">MAPREDUCE-1878</a>.
+     Major improvement reported by kimballa and fixed by kimballa (contrib/mrunit)<br>
+     <b>Add MRUnit documentation</b><br>
+     <blockquote>A short user guide for MRUnit, written in asciidoc.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1868">MAPREDUCE-1868</a>.
+     Major improvement reported by ramach and fixed by ramach (client)<br>
+     <b>Add read timeout on userlog pull</b><br>
+     <blockquote>Add read and connection timeouts to prevent job client hangs.
+<br>
+<br>The jobclient can block indefinitely during the task log pull if a read or connect fails:
+<br>
+<br>        at sun.net.www.protocol.http.HttpURLConnection.getInputStream(HttpURLConnection.java:1049)
+<br>        - locked &lt;0xeed0f0f0&gt; (a sun.net.www.protocol.http.HttpURLConnection)
+<br>        at org.apache.hadoop.mapred.JobClient.getTaskLogs(JobClient.java:1396)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1867">MAPREDUCE-1867</a>.
+     Minor bug reported by amareshwari and fixed by amareshwari (contrib/streaming)<br>
+     <b>Remove unused methods in org.apache.hadoop.streaming.StreamUtil</b><br>
+     <blockquote>There are many unused methods in org.apache.hadoop.streaming.StreamUtil. They should be removed from the class for maintainability. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1866">MAPREDUCE-1866</a>.
+     Minor bug reported by amareshwari and fixed by amareshwari (contrib/streaming)<br>
+     <b>Remove deprecated class org.apache.hadoop.streaming.UTF8ByteArrayUtils</b><br>
+     <blockquote>The class org.apache.hadoop.streaming.UTF8ByteArrayUtils is deprecated in favor of org.apache.hadoop.util.UTF8ByteArrayUtils in branch 0.19.
+<br>The same should be removed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1865">MAPREDUCE-1865</a>.
+     Major bug reported by amar_kamat and fixed by amar_kamat (tools/rumen)<br>
+     <b>[Rumen] Rumen should also support jobhistory files generated using trunk</b><br>
+     <blockquote>Rumen code in trunk parses and processes only jobhistory files from pre-21 hadoop mapreduce clusters. It should also support jobhistory files generated using trunk.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1864">MAPREDUCE-1864</a>.
+     Major bug reported by amareshwari and fixed by amareshwari (contrib/streaming)<br>
+     <b>PipeMapRed.java has uninitialized members log_ and LOGNAME </b><br>
+     <blockquote>PipeMapRed.java has members log_ and LOGNAME, which are never initialized but are used for logging in several places.
+<br>They should be removed and PipeMapRed should use commons LogFactory and Log for logging. This would improve code maintainability.
+<br>
+<br>Also, as per [comment | https://issues.apache.org/jira/browse/MAPREDUCE-1851?focusedCommentId=12878530&amp;page=com.atlassian.jira.plugin.system.issuetabpanels%3Acomment-tabpanel#action_12878530], stream.joblog_ configuration property can be removed.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1863">MAPREDUCE-1863</a>.
+     Major bug reported by amar_kamat and fixed by amar_kamat (tools/rumen)<br>
+     <b>[Rumen] Null failedMapAttemptCDFs in job traces generated by Rumen</b><br>
+     <blockquote>All the traces generated by Rumen for jobs having failed task attempts have a null value for failedMapAttemptCDFs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1857">MAPREDUCE-1857</a>.
+     Trivial bug reported by amareshwari and fixed by amareshwari (contrib/streaming)<br>
+     <b>Remove unused streaming configuration from src</b><br>
+     <blockquote>The configuration stream.numinputspecs is just set and not read anywhere. It can be removed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1851">MAPREDUCE-1851</a>.
+     Major improvement reported by amareshwari and fixed by amareshwari (contrib/streaming, documentation)<br>
+     <b>Document configuration parameters in streaming</b><br>
+     <blockquote>There are several streaming options such as stream.map.output.field.separator, stream.num.map.output.key.fields, stream.map.input.field.separator, stream.reduce.input.field.separator, stream.map.input.ignoreKey, stream.non.zero.exit.is.failure etc. which are spread everywhere. These should be documented in a single place with descriptions and default values.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1850">MAPREDUCE-1850</a>.
+     Major improvement reported by ramach and fixed by ramach <br>
+     <b>Include job submit host information (name and ip) in jobconf and jobdetails display</b><br>
+     <blockquote>Enhancement to identify the source (submit host and ip) of a job request. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1848">MAPREDUCE-1848</a>.
+     Major improvement reported by schen and fixed by schen (jobtracker)<br>
+     <b>Put number of speculative, data local, rack local tasks in JobTracker metrics</b><br>
+     <blockquote>It would be nice to collect this information in the JobTracker metrics.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1840">MAPREDUCE-1840</a>.
+     Major improvement reported by amar_kamat and fixed by amar_kamat (contrib/gridmix)<br>
+     <b>[Gridmix] Exploit/Add security features in GridMix</b><br>
+     <blockquote>Use security information while replaying jobs in Gridmix. This includes
+<br>- Support for multiple users
+<br>- Submitting jobs as different users
+<br>- Allowing usage of secure cluster (hdfs + mapreduce)
+<br>- Support for multiple queues
+<br>
+<br>Other features include : 
+<br>- Support for sleep job
+<br>- Support for load job 
+<br>
+<br>+ testcases for verifying all of the above changes</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1838">MAPREDUCE-1838</a>.
+     Minor improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>DistRaid map tasks have large variance in running times</b><br>
+     <blockquote>HDFS RAID uses map-reduce jobs to generate parity files for a set of source files. Each map task gets a subset of files to operate on. The current code assigns files by walking through the list of files given in the constructor of DistRaid.
+<br>
+<br>The problem is that the list of files given to the constructor has (pretty much) the order of the directory listing. When a large number of files is added, adjacent files in that order tend to have the same size. Thus a map task can end up with large files whereas another can end up with small files, increasing the variance in run times.
+<br>
+<br>We could do smarter assignment by using the file sizes.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1836">MAPREDUCE-1836</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>Refresh for proxy superuser config (mr part for HDFS-1096)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1834">MAPREDUCE-1834</a>.
+     Major bug reported by amareshwari and fixed by hong.tang (contrib/mumak)<br>
+     <b>TestSimulatorDeterministicReplay timesout on trunk</b><br>
+     <blockquote>TestSimulatorDeterministicReplay timesout on trunk.
+<br>See hudson patch build http://hudson.zones.apache.org/hudson/job/Mapreduce-Patch-h4.grid.sp2.yahoo.net/216/testReport/org.apache.hadoop.mapred/TestSimulatorDeterministicReplay/testMain/</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1829">MAPREDUCE-1829</a>.
+     Major improvement reported by schen and fixed by schen (jobtracker)<br>
+     <b>JobInProgress.findSpeculativeTask should use min() to find the candidate instead of sort()</b><br>
+     <blockquote>findSpeculativeTask needs only one candidate to speculate so it does not need to sort the whole list. It may look OK, but someone can still submit big jobs with small slow-task thresholds. In this case, this sorting becomes expensive.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1825">MAPREDUCE-1825</a>.
+     Major bug reported by amareshwari and fixed by schen (jobtracker)<br>
+     <b>jobqueue_details.jsp and FairSchedulerServlet should not call finishedMaps and finishedReduces when a job is not initialized</b><br>
+     <blockquote>JobInProgress.finishedMaps() and finishedReduces() are synchronized. They are called from jobqueue_details.jsp and FairSchedulerServlet, which iterate through all jobs. If any job is in initialization, these pages don&apos;t come up until the initialization finishes.
+<br>
+<br>See [comment|https://issues.apache.org/jira/browse/MAPREDUCE-1354?focusedCommentId=12834139&amp;page=com.atlassian.jira.plugin.system.issuetabpanels%3Acomment-tabpanel#action_12834139] for more details</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1820">MAPREDUCE-1820</a>.
+     Major bug reported by alexvk and fixed by alexvk <br>
+     <b>InputSampler does not create a deep copy of the key object when creating a sample, which causes problems with some formats like SequenceFile&lt;Text,Text&gt;</b><br>
+     <blockquote>I tried to use the InputSampler on a SequenceFile&lt;Text,Text&gt; and found that it comes up with duplicate keys in the sample. The problem was tracked down to the fact that the Text object returned from the reader is essentially a wrapper pointing to a byte array, which changes as the sequence file reader progresses. There was also a bug in that the reader should be initialized before use. I am attaching a patch that fixes both of the issues. --Alex K</blockquote></li>
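+
+<p>One common way to take such a deep copy (a sketch under the assumption that WritableUtils.clone() is acceptable here; the actual MAPREDUCE-1820 patch may do it differently): clone the reused Writable before storing it in the sample.</p>
+<pre>
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.io.Text;
+import org.apache.hadoop.io.WritableUtils;
+
+public class DeepCopyKeyDemo {
+  public static void main(String[] args) {
+    Configuration conf = new Configuration();
+
+    Text reused = new Text("key1");                    // stands in for the reader's reused key object
+    Text copied = WritableUtils.clone(reused, conf);   // deep copy kept in the sample
+
+    reused.set("key2");                                // the reader moves on and overwrites its buffer
+
+    System.out.println(copied);                        // still "key1"; storing "reused" would now show "key2"
+  }
+}
+</pre>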
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1819">MAPREDUCE-1819</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>RaidNode should be smarter in submitting Raid jobs</b><br>
+     <blockquote>The RaidNode currently computes parity files as follows:
+<br>1. Using RaidNode.selectFiles() to figure out what files to raid for a policy
+<br>2. Using #1 repeatedly for each configured policy to accumulate a list of files. 
+<br>3. Submitting a mapreduce job with the list of files from #2 using DistRaid.doDistRaid()
+<br>
+<br>This task addresses the fact that #2 and #3 happen sequentially. The proposal is to submit a separate mapreduce job for the list of files for each policy and use another thread to track the progress of the submitted jobs. This will help reduce the time taken for files to be raided.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1818">MAPREDUCE-1818</a>.
+     Minor improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>RaidNode should specify a pool name incase the cluster is using FairScheduler</b><br>
+     <blockquote>contrib/fairscheduler (FairScheduler) supports scheduling based on pools. The RaidNode should specify a pool name based on configuration to make use of pools.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1816">MAPREDUCE-1816</a>.
+     Minor improvement reported by rvadali and fixed by rvadali (contrib/raid)<br>
+     <b>HAR files used for RAID parity need to have configurable partfile size</b><br>
+     <blockquote>RAID parity files are merged into HAR archives periodically. This is required to reduce the number of files that the NameNode has to track. The number of files present in a HAR archive depends on the size of HAR part files - higher the size, lower the number of files.
+<br>The size of HAR part files is configurable through the setting har.partfile.size, but that is a global setting. This task introduces a new RAID-specific setting, raid.har.partfile.size, that is in turn used to set har.partfile.size.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1813">MAPREDUCE-1813</a>.
+     Major bug reported by amareshwari and fixed by ravidotg (contrib/streaming)<br>
+     <b>NPE in PipeMapred.MRErrorThread</b><br>
+     <blockquote>Some reduce tasks fail with following NPE
+<br>java.lang.RuntimeException: java.lang.NullPointerException
+<br>        at org.apache.hadoop.streaming.PipeMapRed.waitOutputThreads(PipeMapRed.java:325)
+<br>        at org.apache.hadoop.streaming.PipeMapRed.mapRedFinished(PipeMapRed.java:540)
+<br>        at org.apache.hadoop.streaming.PipeReducer.close(PipeReducer.java:137)
+<br>        at org.apache.hadoop.mapred.ReduceTask.runOldReducer(ReduceTask.java:474)
+<br>        at org.apache.hadoop.mapred.ReduceTask.run(ReduceTask.java:412)
+<br>        at org.apache.hadoop.mapred.Child.main(Child.java:159)
+<br>Caused by: java.lang.NullPointerException
+<br>       at org.apache.hadoop.streaming.PipeMapRed$MRErrorThread.setStatus(PipeMapRed.java:517)
+<br>        at org.apache.hadoop.streaming.PipeMapRed$MRErrorThread.run(PipeMapRed.java:449)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1804">MAPREDUCE-1804</a>.
+     Major new feature reported by shv and fixed by shv (benchmarks, test)<br>
+     <b>Stress-test tool for HDFS introduced in HDFS-708</b><br>
+     <blockquote>This issue is to commit the SLive test developed in HDFS-708 to MR trunk.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1798">MAPREDUCE-1798</a>.
+     Major improvement reported by boryas and fixed by boryas <br>
+     <b>normalize property names for JT kerberos principal names in configuration (from HADOOP 6633)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1785">MAPREDUCE-1785</a>.
+     Minor improvement reported by eli and fixed by eli (contrib/streaming)<br>
+     <b>Add streaming config option for not emitting the key</b><br>
+     <blockquote>PipeMapper currently does not emit the key when using TextInputFormat. If you switch to other input formats (e.g. LzoTextInputFormat), the key will be emitted. We should add an option so users can explicitly make streaming not emit the key, so they can change input formats without breaking or having to modify their existing programs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1784">MAPREDUCE-1784</a>.
+     Minor bug reported by eli and fixed by eli <br>
+     <b>IFile should check for null compressor</b><br>
+     <blockquote>IFile assumes that when it has a codec it can always get a compressor. This fails when mapred.compress.map.output is true but the native libraries are not installed, resulting in an NPE.
+<br>Let&apos;s make IFile handle this case by logging and using non-compressed streams.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1783">MAPREDUCE-1783</a>.
+     Major improvement reported by rvadali and fixed by rvadali (contrib/fair-share)<br>
+     <b>Task Initialization should be delayed till when a job can be run</b><br>
+     <blockquote>The FairScheduler task scheduler uses PoolManager to impose limits on the number of jobs that can be running at a given time. However, jobs that are submitted are initialized immediately by EagerTaskInitializationListener by calling JobInProgress.initTasks. This causes the job split file to be read into memory. The split information is not needed until the number of running jobs is less than the maximum specified. If the amount of split information is large, this leads to unnecessary memory pressure on the Job Tracker.
+<br>To ease memory pressure, FairScheduler can use another implementation of JobInProgressListener that is aware of PoolManager limits and can delay task initialization until the number of running jobs is below the maximum.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1780">MAPREDUCE-1780</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (jobtracker)<br>
+     <b>AccessControlList.toString() is used for serialization of ACL in JobStatus.java</b><br>
+     <blockquote>HADOOP-6715 is created to fix AccessControlList.toString() for the case of WILDCARD. JobStatus.write() and readFields() assume that toString() returns the serialized String of AccessControlList object, which is not true. Once HADOOP-6715 gets fixed in COMMON, JobStatus.write() and JobStatus.readFields() should be fixed depending on the fix of HADOOP-6715.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1778">MAPREDUCE-1778</a>.
+     Major improvement reported by amar_kamat and fixed by ramach (jobtracker)<br>
+     <b>CompletedJobStatusStore initialization should fail if {mapred.job.tracker.persist.jobstatus.dir} is unwritable</b><br>
+     <blockquote>If {mapred.job.tracker.persist.jobstatus.dir} points to an unwritable location or mkdir of {mapred.job.tracker.persist.jobstatus.dir} fails, then CompletedJobStatusStore silently ignores the failure and disables CompletedJobStatusStore. Ideally the JobTracker should bail out early indicating a misconfiguration.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1773">MAPREDUCE-1773</a>.
+     Major bug reported by aloknsingh and fixed by amareshwari (contrib/streaming)<br>
+     <b>streaming doesn&apos;t support jobclient.output.filter</b><br>
+     <blockquote>The streaming JobClient implementation, i.e. contrib/streaming/src/java/org/apache/hadoop/streaming/StreamJob.java, is significantly different from the core hadoop mapred/org/apache/hadoop/mapred/JobClient.java.
+<br>For example, unlike StreamJob.java, JobClient.java fetches the task logs when jobclient.output.filter=ALL is specified.
+<br>With hod-logs going away in hadoop 0.20 (due to the new scheduler), users have no good way of programmatically getting logs.
+<br>We should have an intermediate adaptor class to implement Tools for the purpose of submitting jobs via m/r, streaming, and pipes so that we don&apos;t miss some core functionality.
+<br>GenericJobClient implements Tools and then StreamJob extends GenericJobClient, JobClient extends GenericJobClient
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1772">MAPREDUCE-1772</a>.
+     Minor bug reported by menicosia and fixed by amareshwari (contrib/streaming, documentation)<br>
+     <b>Hadoop streaming doc should not use IdentityMapper as an example</b><br>
+     <blockquote>From the URL http://hadoop.apache.org/core/docs/current/streaming.html
+<br>
+<br>This example doesn&apos;t work:
+<br>You can supply a Java class as the mapper and/or the reducer. The above example is equivalent to:
+<br>
+<br>$HADOOP_HOME/bin/hadoop  jar $HADOOP_HOME/hadoop-streaming.jar \
+<br>    -input myInputDirs \
+<br>    -output myOutputDir \
+<br>    -mapper org.apache.hadoop.mapred.lib.IdentityMapper \
+<br>    -reducer /bin/wc
+<br>
+<br>This will produce the following exception:
+<br>java.io.IOException: Type mismatch in key from map: expected org.apache.hadoop.io.Text, recieved org.apache.hadoop.io.LongWritable
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1762">MAPREDUCE-1762</a>.
+     Major improvement reported by schen and fixed by schen <br>
+     <b>Add a setValue() method in Counter</b><br>
+     <blockquote>Counters are very useful because the logging and transmission are already in place.
+<br>It is very convenient to transmit and store numbers, but currently Counter only has an increment() method.
+<br>It would be nice if there were a setValue() method in this class that would allow a wider variety of information to be transmitted through it.</blockquote></li>
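+
+<p>For MAPREDUCE-1762 above, a small illustration of how a task might use the proposed setValue() method added by this change; the mapper class, counter group and counter name are invented for the example:</p>
+<pre>
+import java.io.IOException;
+import org.apache.hadoop.io.LongWritable;
+import org.apache.hadoop.io.Text;
+import org.apache.hadoop.mapreduce.Mapper;
+
+public class GaugeMapper extends Mapper&lt;LongWritable, Text, Text, LongWritable&gt; {
+  @Override
+  protected void cleanup(Context context) throws IOException, InterruptedException {
+    // Publish an absolute value instead of accumulating increments.
+    Runtime rt = Runtime.getRuntime();
+    long heapUsed = rt.totalMemory() - rt.freeMemory();
+    context.getCounter("stats", "heap-bytes-at-cleanup").setValue(heapUsed);
+  }
+}
+</pre>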
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1761">MAPREDUCE-1761</a>.
+     Major improvement reported by schen and fixed by schen <br>
+     <b>FairScheduler should allow separate configuration of node and rack locality wait time</b><br>
+     <blockquote>It would be nice to be able to configure the rack locality wait time separately.
+<br>In our use case, we would set the node locality wait to zero and wait only for rack locality.
+<br>
+<br>The proposal is to add two parameters:
+<br>mapred.fairscheduler.locality.delay.nodetorack
+<br>mapred.fairscheduler.locality.delay.racktoany
+<br>This allows the wait time to be specified for each stage.
+<br>
+<br>The existing
+<br>mapred.fairscheduler.locality.delay
+<br>can be used as the default value of the above fields so that the change is backward compatible.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1754">MAPREDUCE-1754</a>.
+     Major bug reported by amareshwari and fixed by amareshwari (jobtracker)<br>
+     <b>Replace mapred.permissions.supergroup with an acl : mapreduce.cluster.administrators</b><br>
+     <blockquote>mapred.permissions.supergroup should be replaced with an acl so that it does not restrict the admins to a single group.
+<br>See more details on MAPREDUCE-1542.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1733">MAPREDUCE-1733</a>.
+     Major new feature reported by jnp and fixed by jnp <br>
+     <b>Authentication between pipes processes and java counterparts.</b><br>
+     <blockquote>The connection between a pipe process and its parent java process should be authenticated.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1718">MAPREDUCE-1718</a>.
+     Major bug reported by boryas and fixed by boryas <br>
+     <b>job conf key for the services name of DelegationToken for HFTP url is constructed incorrectly in HFTPFileSystem</b><br>
+     <blockquote>The key (built in TokenCache) is hdfs.service.host_HOSTNAME.PORT, but
+<br>in HftpFileSystem it is sometimes built as hdfs.service.host_IP.PORT.
+<br>
+<br>Fix: change it to always be the IP.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1711">MAPREDUCE-1711</a>.
+     Major improvement reported by hong.tang and fixed by rksingh (contrib/gridmix)<br>
+     <b>Gridmix should provide an option to submit jobs to the same queues as specified in the trace.</b><br>
+     <blockquote>Gridmix should provide an option to submit jobs to the same queues as specified in the trace.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1707">MAPREDUCE-1707</a>.
+     Major bug reported by amareshwari and fixed by vinodkv (tasktracker)<br>
+     <b>TaskRunner can get NPE in getting ugi from TaskTracker</b><br>
+     <blockquote>The following code in TaskRunner can get NPE in the scenario described below.
+<br>      UserGroupInformation ugi = 
+<br>        tracker.getRunningJob(t.getJobID()).getUGI();
+<br>
+<br>The scenario:
+<br>Tracker got a LaunchTaskAction; Task is localized and TaskRunner is started.
+<br>Then Tracker got a KillJobAction; This would issue a kill for the task. But, kill will be a no-op because the task did not actually start; The job is removed from runningJobs. 
+<br>Then if TaskRunner calls tracker.getRunningJob(t.getJobID()), it will be null.
+<br>
+<br>Instead of TaskRunner calling back to the tasktracker to get the ugi via tracker.getRunningJob(t.getJobID()).getUGI(), the ugi should be passed as a parameter in the constructor of TaskRunner.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1701">MAPREDUCE-1701</a>.
+     Major bug reported by devaraj and fixed by boryas (jobtracker)<br>
+     <b>AccessControlException while renewing a delegation token is not correctly handled in the JobTracker</b><br>
+     <blockquote>The timer task for renewing delegation token gets scheduled even when an AccessControlException is obtained. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1686">MAPREDUCE-1686</a>.
+     Minor bug reported by pburkhardt and fixed by pburkhardt (contrib/streaming, test)<br>
+     <b>ClassNotFoundException for custom format classes provided in libjars</b><br>
+     <blockquote>The StreamUtil::goodClassOrNull method assumes user-provided classes have package names and, if not, that they are part of the Hadoop Streaming package. For example, using custom InputFormat or OutputFormat classes without package names will fail with a ClassNotFound exception, which is misleading given that the classes are provided via the libjars option. Admittedly, most Java classes should have a package name, so this should rarely come up.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1683">MAPREDUCE-1683</a>.
+     Major bug reported by chris.douglas and fixed by vicaya (jobtracker)<br>
+     <b>Remove JNI calls from ClusterStatus cstr</b><br>
+     <blockquote>The {{ClusterStatus}} constructor makes two JNI calls to the {{Runtime}} to fetch memory information. {{ClusterStatus}} instances are often created inside the {{JobTracker}} to obtain other, unrelated metrics (sometimes from schedulers&apos; inner loops). Given that this information is related to the {{JobTracker}} process and not the cluster, the metrics are also available via {{JvmMetrics}}, and the jsps can gather this information for themselves: these fields can be removed from {{ClusterStatus}}</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1680">MAPREDUCE-1680</a>.
+     Major new feature reported by hong.tang and fixed by dking (jobtracker)<br>
+     <b>Add a metrics to track the number of heartbeats processed</b><br>
+     <blockquote>It would be nice to add a metrics that tracks the number of heartbeats processed by JT.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1670">MAPREDUCE-1670</a>.
+     Major bug reported by rschmidt and fixed by rvadali (contrib/raid)<br>
+     <b>RAID should avoid policies that scan their own destination path</b><br>
+     <blockquote>Raid currently allows policies that include the destination directory into the source directory and vice-versa.
+<br>Both situations can create cycles and should be avoided.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1668">MAPREDUCE-1668</a>.
+     Major bug reported by rschmidt and fixed by rvadali (contrib/raid)<br>
+     <b>RaidNode should only Har a directory if all its parity files have been created</b><br>
+     <blockquote>In the current code, it can happen that a directory will be Archived (Har&apos;ed) before all its parity files have been generated since parity file generation is not atomic. We should verify if all the parity files are present before Archiving a directory.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1664">MAPREDUCE-1664</a>.
+     Major bug reported by ravidotg and fixed by ravidotg (security)<br>
+     <b>Job Acls affect Queue Acls</b><br>
+     <blockquote>MAPREDUCE-1307 introduced job ACLs for securing job level operations. So in current trunk, queue ACLs and job ACLs are checked(with AND for both acls) for allowing job level operations. So for doing operations like killJob, killTask and setJobPriority user should be part of both mapred.queue.{queuename}.acl-administer-jobs and in mapreduce.job.acl-modify-job. This needs to change so that users who are part of mapred.queue.{queuename}.acl-administer-jobs will be able to do killJob,killTask,setJobPriority and users part of mapreduce.job.acl-modify-job will be able to do killJob,killTask,setJobPriority.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1662">MAPREDUCE-1662</a>.
+     Major bug reported by amareshwari and fixed by amareshwari (tasktracker)<br>
+     <b>TaskRunner.prepare() and close() can be removed</b><br>
+     <blockquote>TaskRunner.prepare() and close() methods call only mapOutputFile.removeAll(). The removeAll() call is always a no-op in prepare(), because the directory is always empty during startup of the task. The removeAll() call in close() is useless, because it is followed by an attempt-directory cleanup. Since the map output files are in the attempt directory, the call to close() is useless.
+<br>After MAPREDUCE-842, these calls are under TaskTracker space, passing the wrong conf. Now, the calls do not make sense at all.
+<br>I think we can remove the methods.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1626">MAPREDUCE-1626</a>.
+     Major improvement reported by tomwhite and fixed by jolly (documentation)<br>
+     <b>Publish Javadoc for all contrib packages with user-facing APIs</b><br>
+     <blockquote>Some packages don&apos;t appear in the Javadoc. E.g. MRUnit, Vertica.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1621">MAPREDUCE-1621</a>.
+     Major bug reported by tlipcon and fixed by amareshwari (contrib/streaming)<br>
+     <b>Streaming&apos;s TextOutputReader.getLastOutput throws NPE if it has never read any output</b><br>
+     <blockquote>If TextOutputReader.readKeyValue() has never successfully read a line, then its bytes member will be left null. Thus when logging a task failure, PipeMapRed.getContext() can trigger an NPE when it calls outReader_.getLastOutput().</blockquote></li>
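+
+<p>For MAPREDUCE-1621 above, a minimal sketch of the kind of null guard that avoids the NPE; the class and field below only mirror the description and are not the actual TextOutputReader code:</p>
+<pre>
+import org.apache.hadoop.io.Text;
+
+public class LastOutputHolder {
+  private byte[] bytes; // stays null until a line has been read successfully
+
+  /** Return the last output read, or a placeholder when nothing has been read yet. */
+  public String getLastOutput() {
+    if (bytes == null) {
+      return "(no output has been read yet)";
+    }
+    return new Text(bytes).toString();
+  }
+}
+</pre>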
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1617">MAPREDUCE-1617</a>.
+     Major bug reported by amareshwari and fixed by vicaya (test)<br>
+     <b>TestBadRecords failed once in our test runs</b><br>
+     <blockquote>org.apache.hadoop.mapred.TestBadRecords.testBadMapRed failed with the following
+<br>exception:
+<br>java.io.IOException: Job failed!
+<br>        at org.apache.hadoop.mapred.JobClient.runJob(JobClient.java:1142)
+<br>        at org.apache.hadoop.mapred.TestBadRecords.runMapReduce(TestBadRecords.java:94)
+<br>        at org.apache.hadoop.mapred.TestBadRecords.testBadMapRed(TestBadRecords.java:211)
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1599">MAPREDUCE-1599</a>.
+     Major bug reported by jnp and fixed by jnp <br>
+     <b>MRBench reuses jobConf and credentials there in.</b><br>
+     <blockquote>MRBench reuses the jobconf and therefore its credentials are re-used, but the JobTracker cancels the delegation tokens, so the test fails sometimes.
+<br>The fix is to pass the mapreduce.job.complete.cancel.delegation.tokens=false in the jobconf so that JobTracker does not cancel the tokens.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1597">MAPREDUCE-1597</a>.
+     Major bug reported by namit and fixed by amareshwari <br>
+     <b>combinefileinputformat does not work with non-splittable files</b><br>
+     <blockquote>CombineFileInputFormat.getSplits() does not take into account whether a file is splittable.
+<br>This can lead to a problem for compressed text files - for example, getSplits() may return more
+<br>than 1 split depending on the size of the compressed file, but each split&apos;s record reader will read the
+<br>complete file.
+<br>
+<br>I ran into this problem while using Hive on hadoop 20.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1594">MAPREDUCE-1594</a>.
+     Major new feature reported by rksingh and fixed by rksingh (contrib/gridmix)<br>
+     <b>Support for Sleep Jobs in gridmix</b><br>
+     <blockquote>Support for Sleep jobs in gridmix</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1592">MAPREDUCE-1592</a>.
+     Major improvement reported by tomwhite and fixed by tomwhite (build)<br>
+     <b>Generate Eclipse&apos;s .classpath file from Ivy config</b><br>
+     <blockquote>MapReduce companion issue for HADOOP-6407.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1566">MAPREDUCE-1566</a>.
+     Major bug reported by owen.omalley and fixed by jnp (security)<br>
+     <b>Need to add a mechanism to import tokens and secrets into a submitted job.</b><br>
+     <blockquote>We need to include tokens and secrets into a submitted job. I propose adding a configuration attribute that when pointed at a token storage file will include the tokens and secrets from that token storage file.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1559">MAPREDUCE-1559</a>.
+     Major bug reported by devaraj and fixed by devaraj (jobtracker)<br>
+     <b>The DelegationTokenRenewal timer task should use the jobtracker&apos;s credentials to create the filesystem</b><br>
+     <blockquote>The submitJob RPC finally creates a timer task for renewing the delegation tokens of the submitting user. This timer task inherits the context of the RPC handler that runs in the context of the job submitting user, and when it tries to create a filesystem, the RPC client tries to use the user&apos;s credentials. This should instead use the JobTracker&apos;s credentials.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1558">MAPREDUCE-1558</a>.
+     Major bug reported by boryas and fixed by boryas (security)<br>
+     <b>specify correct server principal for RefreshAuthorizationPolicyProtocol and RefreshUserToGroupMappingsProtocol protocols in MRAdmin (for HADOOP-6612)</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1548">MAPREDUCE-1548</a>.
+     Major improvement reported by rschmidt and fixed by rschmidt (harchive)<br>
+     <b>Hadoop archives should be able to preserve times and other properties from original files</b><br>
+     <blockquote>Files inside hadoop archives don&apos;t keep their original:
+<br>
+<br>- modification time
+<br>- access time
+<br>- permission
+<br>- owner
+<br>- group
+<br>
+<br>all such properties are currently taken from the file storing the archive index, and not the stored files. This doesn&apos;t look very correct.
+<br>
+<br>It should be possible to preserve the original properties of the stored files.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1546">MAPREDUCE-1546</a>.
+     Minor improvement reported by schen and fixed by schen <br>
+     <b>Jobtracker JSP pages should automatically redirect to the corresponding history page if not in memory</b><br>
+     <blockquote>MAPREDUCE-1185 redirects jobdetails.jsp to it&apos;s corresponding history page.
+<br>
+<br>For convenience, we should also redirect the following JSP pages to the corresponding history pages:
+<br>jobconf.jsp
+<br>jobtasks.jsp
+<br>taskdetails.jsp
+<br>taskstats.jsp
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1545">MAPREDUCE-1545</a>.
+     Major improvement reported by acmurthy and fixed by vicaya (jobtracker)<br>
+     <b>Add &apos;first-task-launched&apos; to job-summary</b><br>
+     <blockquote>It would be useful to track &apos;first-task-launched&apos; time to job-summary for better reporting.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1543">MAPREDUCE-1543</a>.
+     Major bug reported by vinodkv and fixed by vicaya (security)<br>
+     <b>Log messages of JobACLsManager should use security logging of HADOOP-6586</b><br>
+     <blockquote>{{JobACLsManager}} added in MAPREDUCE-1307 logs the successes and failures w.r.t job-level authorization in the corresponding Daemons&apos; logs. The log messages should instead use security logging of HADOOP-6586.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1533">MAPREDUCE-1533</a>.
+     Major bug reported by rajesh.balamohan and fixed by dking (jobtracker)<br>
+     <b>Reduce or remove usage of String.format() usage in CapacityTaskScheduler.updateQSIObjects and Counters.makeEscapedString()</b><br>
+     <blockquote>When short jobs are executed in hadoop with OutOfBandHeartBeat=true, the JT executes the heartBeat() method heavily. This internally makes a call to CapacityTaskScheduler.updateQSIObjects().
+<br>
+<br>CapacityTaskScheduler.updateQSIObjects() internally calls String.format() for setting the job scheduling information. Based on the datastructure size of &quot;jobQueuesManager&quot; and &quot;queueInfoMap&quot;, the number of times String.format() gets executed becomes very high. String.format() internally does pattern matching, which turns out to be very heavy. (This was revealed while profiling the JT: almost 57% of the time was spent in CapacityScheduler.assignTasks(), out of which String.format() took 46%.)
+<br>
+<br>Would it be possible to do String.format() only at the time of invoking JobInProgress.getSchedulingInfo()? This might reduce the pressure on the JT while processing heartbeats.</blockquote></li>
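+
+<p>For MAPREDUCE-1533 above, purely as an illustration of the cost being discussed (not the proposed change itself, which is to defer formatting until JobInProgress.getSchedulingInfo() is called), a format string re-parsed on every heartbeat can be replaced by plain appends; the class and numbers below are hypothetical:</p>
+<pre>
+public class SchedulingInfoFormat {
+  /** String.format() re-parses the pattern on every call; expensive in a hot path. */
+  static String slow(int running, int pending) {
+    return String.format("%d running, %d pending", running, pending);
+  }
+
+  /** Plain StringBuilder appends avoid the pattern-matching overhead. */
+  static String fast(int running, int pending) {
+    return new StringBuilder(32)
+        .append(running).append(" running, ")
+        .append(pending).append(" pending").toString();
+  }
+}
+</pre>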
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1532">MAPREDUCE-1532</a>.
+     Major bug reported by devaraj and fixed by devaraj (job submission, security)<br>
+     <b>Delegation token is obtained as the superuser</b><br>
+     <blockquote>When the UserGroupInformation.doAs is invoked for proxy users, the delegation token is incorrectly obtained as the real user.</blockquote></li>
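+
+<p>For MAPREDUCE-1532 above, the doAs pattern in question looks roughly like the sketch below; the helper class is illustrative and assumes the proxy-user configuration allows the real (login) user to impersonate the named user:</p>
+<pre>
+import java.security.PrivilegedExceptionAction;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.security.UserGroupInformation;
+
+public class ProxyUserExample {
+  /** Obtain a FileSystem as the proxied user rather than as the real (login) user. */
+  public static FileSystem fileSystemAs(String user, final Configuration conf)
+      throws Exception {
+    UserGroupInformation proxy =
+        UserGroupInformation.createProxyUser(user, UserGroupInformation.getLoginUser());
+    return proxy.doAs(new PrivilegedExceptionAction&lt;FileSystem&gt;() {
+      public FileSystem run() throws Exception {
+        return FileSystem.get(conf); // runs with the proxied user's credentials
+      }
+    });
+  }
+}
+</pre>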
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1528">MAPREDUCE-1528</a>.
+     Major bug reported by owen.omalley and fixed by jnp <br>
+     <b>TokenStorage should not be static</b><br>
+     <blockquote>Currently, TokenStorage is a singleton. This doesn&apos;t work for some use cases, such as Oozie. I think that each Job should have a TokenStorage that is associated it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1526">MAPREDUCE-1526</a>.
+     Major improvement reported by rksingh and fixed by rksingh (contrib/gridmix)<br>
+     <b>Cache the job related information while submitting the job , this would avoid many RPC calls to JobTracker.</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1517">MAPREDUCE-1517</a>.
+     Major new feature reported by sinofool and fixed by sinofool (contrib/streaming)<br>
+     <b>streaming should support running on background</b><br>
+     <blockquote>StreamJob submits the job and uses a while loop to monitor the progress.
+<br>It would be preferable to be able to run it in the background.
+<br>
+<br>Adding &quot;&amp;&quot; at the end of the command is an alternative solution, but it keeps a java process on the client machine.
+<br>When hundreds of jobs are submitted at the same time, the client machine is overloaded.
+<br>
+<br>Adding a -background option to StreamJob would tell it to only submit the job and not monitor the progress.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1516">MAPREDUCE-1516</a>.
+     Major new feature reported by jnp and fixed by jnp <br>
+     <b>JobTracker should issue a delegation token only for kerberos authenticated client</b><br>
+     <blockquote>Delegation tokens should be issued only if the client is kerberos authenticated.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1505">MAPREDUCE-1505</a>.
+     Major bug reported by devaraj and fixed by dking (client)<br>
+     <b>Cluster class should create the rpc client only when needed</b><br>
+     <blockquote>It will be good to have the org.apache.hadoop.mapreduce.Cluster create the rpc client object only when needed (when a call to the jobtracker is actually required). org.apache.hadoop.mapreduce.Job constructs the Cluster object internally and in many cases the application that created the Job object really wants to look at the configuration only. It&apos;d help to not have these connections to the jobtracker especially when Job is used in the tasks (for e.g., Pig calls mapreduce.FileInputFormat.setInputPath in the tasks and that requires a Job object to be passed).
+<br>
+<br>In Hadoop 20, the Job object internally creates the JobClient object, and the same argument applies there too.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1492">MAPREDUCE-1492</a>.
+     Major improvement reported by rschmidt and fixed by rschmidt (contrib/raid)<br>
+     <b>Delete or recreate obsolete har files used on hdfs raid</b><br>
+     <blockquote>The current code for har on raid doesn&apos;t delete or recreate har directories when they become obsolete. We should fix that.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1382">MAPREDUCE-1382</a>.
+     Major improvement reported by schen and fixed by zshao <br>
+     <b>MRAsyncDiscService should tolerate missing local.dir</b><br>
+     <blockquote>Currently when some of the local.dir do not exist, MRAsyncDiscService will fail. It should only fail when all directories don&apos;t work.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1376">MAPREDUCE-1376</a>.
+     Major improvement reported by chris.douglas and fixed by chris.douglas (contrib/gridmix)<br>
+     <b>Support for varied user submission in Gridmix</b><br>
+     <blockquote>Gridmix currently submits all synthetic jobs as the client user. It should be possible to map users in the trace to a set of users appropriate for the target cluster.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1375">MAPREDUCE-1375</a>.
+     Major bug reported by amar_kamat and fixed by tlipcon (contrib/streaming, test)<br>
+     <b>TestFileArgs fails intermittently</b><br>
+     <blockquote>TestFileArgs failed once for me with the following error
+<br>expected:&lt;[job.jar
+<br>sidefile
+<br>tmp
+<br>]&gt; but was:&lt;[]&gt;
+<br>        at org.apache.hadoop.streaming.TestStreaming.checkOutput(TestStreaming.java:107)
+<br>        at org.apache.hadoop.streaming.TestStreaming.testCommandLine(TestStreaming.java:123)
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1354">MAPREDUCE-1354</a>.
+     Critical improvement reported by devaraj and fixed by dking (jobtracker)<br>
+     <b>Incremental enhancements to the JobTracker for better scalability</b><br>
+     <blockquote>It&apos;d be nice to have the JobTracker object not be locked while accessing the HDFS for reading the jobconf file and while writing the jobinfo file in the submitJob method. We should see if we can avoid taking the lock altogether.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1288">MAPREDUCE-1288</a>.
+     Critical bug reported by devaraj and fixed by devaraj (distributed-cache, security, tasktracker)<br>
+     <b>DistributedCache localizes only once per cache URI</b><br>
+     <blockquote>As part of the file localization the distributed cache localizer creates a copy of the file in the corresponding user&apos;s private directory. The localization in DistributedCache assumes the key as the URI of the cachefile and if it already exists in the map, the localization is not done again. This means that another user cannot access the same distributed cache file. We should change the key to include the username so that localization is done for every user.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1253">MAPREDUCE-1253</a>.
+     Major improvement reported by anirban.dasgupta and fixed by anirban.dasgupta (contrib/mumak)<br>
+     <b>Making Mumak work with Capacity-Scheduler</b><br>
+     <blockquote>In order to make the capacity-scheduler work in the mumak simulation environment, we have to replace the job-initialization threads of the capacity scheduler with classes that perform event-based initialization. We propose to use aspectj to disable the threads  of the JobInitializationPoller class used by the Capacity Scheduler, and then perform the corresponding initialization tasks through a simulation job-initialization class that receives periodic wake-up calls from the simulator engine.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1248">MAPREDUCE-1248</a>.
+     Minor improvement reported by ruibang and fixed by ruibang (contrib/streaming)<br>
+     <b>Redundant memory copying in StreamKeyValUtil</b><br>
+     <blockquote>I found that when MROutputThread collects the output of the Reducer, it calls StreamKeyValUtil.splitKeyVal() and two local byte-arrays are allocated there for each line of output. These two byte-arrays are then passed to the variables key and val. There are two memory copies here: one is the System.arraycopy() call, the other is inside key.set() / val.set().
+<br>
+<br>This doubles the memory copying for the whole output (which may lead to higher CPU consumption) and causes frequent temporary object allocation.</blockquote></li>
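+
+<p>For MAPREDUCE-1248 above, a minimal sketch of the idea: Text.set(byte[], int, int) copies straight from the line buffer into the reused Text objects, avoiding the intermediate byte arrays and the second copy. The method below is illustrative, not the actual StreamKeyValUtil signature:</p>
+<pre>
+import org.apache.hadoop.io.Text;
+
+public class SplitKeyVal {
+  /** Split line[0..lineLen) at the first tab into reused key/val Text objects. */
+  public static void split(byte[] line, int lineLen, Text key, Text val) {
+    int sep = -1;
+    for (int i = 0; i &lt; lineLen; i++) {
+      if (line[i] == '\t') {
+        sep = i;
+        break;
+      }
+    }
+    if (sep &lt; 0) {
+      key.set(line, 0, lineLen); // whole line is the key
+      val.set(line, 0, 0);       // empty value
+    } else {
+      key.set(line, 0, sep);
+      val.set(line, sep + 1, lineLen - sep - 1);
+    }
+  }
+}
+</pre>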
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1225">MAPREDUCE-1225</a>.
+     Major bug reported by vinodkv and fixed by zhong (tasktracker)<br>
+     <b>TT successfully localizes a task even though the corresponding cache-file has already changed on DFS.</b><br>
+     <blockquote>This happens with the first task of a job being localized on this TT. TT doesn&apos;t check if the file on DFS is fresh according to the timestamps set in job-conf during submission. After the first task incorrectly gets localized, all further tasks fail on this TT as expected.
+<br>
+<br>Found this issue while trying to improve the test case for MAPREDUCE-913.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1159">MAPREDUCE-1159</a>.
+     Trivial improvement reported by zshao and fixed by qwertymaniac <br>
+     <b>Limit Job name on jobtracker.jsp to be 80 char long</b><br>
+     <blockquote>Sometimes a user submits a job with a very long job name. That makes jobtracker.jsp very hard to read.
+<br>We should limit the size of the job name. Users can see the full name when they click on the job.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1118">MAPREDUCE-1118</a>.
+     Major bug reported by aw and fixed by ramach (contrib/capacity-sched)<br>
+     <b>Capacity Scheduler scheduling information is hard to read / should be tabular format</b><br>
+     <blockquote>The scheduling information provided by the capacity scheduler is extremely hard to read on the job tracker web page.  Instead of just flat text, it should be presenting the information in a tabular format, similar to what the fair share scheduler provides.  This makes it much easier to compare what different queues are doing.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1092">MAPREDUCE-1092</a>.
+     Major test reported by eli and fixed by eli (test)<br>
+     <b>Enable asserts for tests by default</b><br>
+     <blockquote>See HADOOP-6309. Let&apos;s make the tests run with java asserts by default.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1085">MAPREDUCE-1085</a>.
+     Minor bug reported by ravidotg and fixed by tlipcon (tasktracker)<br>
+     <b>For tasks, &quot;ulimit -v -1&quot; is being run when user doesn&apos;t specify mapred.child.ulimit</b><br>
+     <blockquote>For tasks, &quot;ulimit -v -1&quot; is being run when the user doesn&apos;t specify mapred.child.ulimit. Taking -1 as the default value and using it in building the command is not right.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-927">MAPREDUCE-927</a>.
+     Major sub-task reported by vinodkv and fixed by amareshwari (security, tasktracker)<br>
+     <b>Cleanup of task-logs should happen in TaskTracker instead of the Child</b><br>
+     <blockquote>Task logs&apos; cleanup is being done in Child now. This is undesirable for at least two reasons: 1) failures while cleaning up will affect the user&apos;s tasks, and 2) the task&apos;s wall time will be affected by operations that the TT actually should own.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-869">MAPREDUCE-869</a>.
+     Major bug reported by acmurthy and fixed by tucu00 (documentation, task)<br>
+     <b>Documentation for config to set map/reduce task environment</b><br>
+     <blockquote>HADOOP-2838 added mapred.child.env to allow users to set the map/reduce tasks&apos; environment.
+<br>
+<br>MAPREDUCE-478 will break that into mapred.map.child.env and mapred.reduce.child.env. We need to add documentation (forrest) for these knobs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-714">MAPREDUCE-714</a>.
+     Major bug reported by tlipcon and fixed by tlipcon <br>
+     <b>JobConf.findContainingJar unescapes unnecessarily on Linux</b><br>
+     <blockquote>In JobConf.findContainingJar, the path name is decoded using URLDecoder.decode(...). This was done by Doug in r381794 (commit msg &quot;Un-escape containing jar&apos;s path, which is URL-encoded.  This fixes things primarily on Windows, where paths are likely to contain spaces.&quot;) Unfortunately, jar paths do not appear to be URL encoded on Linux. If you try to use &quot;hadoop jar&quot; on a jar with a &quot;+&quot; in it, this function decodes it to a space and then the job cannot be submitted.
+<br></blockquote></li>
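+
+<p>For MAPREDUCE-714 above, the behaviour is easy to reproduce in isolation; the jar path below is made up for the illustration. URLDecoder.decode() treats a literal plus sign as an encoded space, which is why a jar whose filename contains a plus sign can no longer be found after decoding:</p>
+<pre>
+import java.net.URLDecoder;
+
+public class PlusInJarPath {
+  public static void main(String[] args) throws Exception {
+    String rawPath = "/tmp/my+app.jar";          // jar name contains a literal '+'
+    String decoded = URLDecoder.decode(rawPath, "UTF-8");
+    System.out.println(decoded);                 // prints /tmp/my app.jar -- wrong file
+  }
+}
+</pre>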
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-647">MAPREDUCE-647</a>.
+     Major bug reported by rschmidt and fixed by rschmidt (documentation)<br>
+     <b>Update the DistCp forrest doc to make it consistent with the latest changes (5472, 5620, 5762, 5826)</b><br>
+     <blockquote>New features have been added to DistCp and the documentation must be updated.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-577">MAPREDUCE-577</a>.
+     Major bug reported by camda03 and fixed by ravidotg (contrib/streaming)<br>
+     <b>Duplicate Mapper input when using StreamXmlRecordReader</b><br>
+     <blockquote>
+I believe that the problem is in StreamXmlRecordReader.java in the fast-match code. When the bytestream doesn't completely match the begin/end pattern, the code does "pos_ += m" to increment the position in the stream by the number of characters matching the pattern... but it forgets the "c" character which didn't match. Ultimately, the code ends up reading significantly past the end of the split, resulting in the same record (at least the first one right after the split) being detected by multiple StreamXmlRecordReader instances.
+</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-572">MAPREDUCE-572</a>.
+     Minor bug reported by karams and fixed by amareshwari (contrib/streaming)<br>
+     <b>If #link is missing from uri format of -cacheArchive then streaming does not throw error.</b><br>
+     <blockquote>Ran the hadoop streaming command as:
+<br>bin/hadoop jar contrib/streaming/hadoop-*-streaming.jar -input in -output out -mapper &quot;xargs cat&quot;  -reducer &quot;bin/cat&quot; -cacheArchive hdfs://h:p/pathofJarFile
+<br>Streaming submits the job to the jobtracker and the map fails.
+<br>For a similar command with -cacheFile:
+<br>bin/hadoop jar contrib/streaming/hadoop-*-streaming.jar -input in -output out -mapper &quot;xargs cat&quot;  -reducer &quot;bin/cat&quot; -cacheFile hdfs://h:p/pathofFile
+<br>the following error is reported back:
+<br>
+<br>You need to specify the uris as hdfs://host:port/#linkname,Please specify a different link name for all of your caching URIs
+<br>
+<br>Streaming should check that #link is present after the uri of cacheArchive and should throw a proper error.
+<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-231">MAPREDUCE-231</a>.
+     Major task reported by owen.omalley and fixed by owen.omalley <br>
+     <b>Split map/reduce into sub-project</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-220">MAPREDUCE-220</a>.
+     Major new feature reported by hong.tang and fixed by schen (task, tasktracker)<br>
+     <b>Collecting cpu and memory usage for MapReduce tasks</b><br>
+     <blockquote>It would be nice for TaskTracker to collect cpu and memory usage for individual Map or Reduce tasks over time.</blockquote></li>
+
+</ul>
+
+
+<h2>Changes since Hadoop 0.21.0</h2>
+<ul>
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7194">HADOOP-7194</a>.
+     Major bug reported by devaraj.k and fixed by devaraj.k (io)<br>
+     <b>Potential Resource leak in IOUtils.java</b><br>
+     <blockquote>try {<br>      copyBytes(in, out, buffSize);<br>    } finally {<br>      if(close) {<br>        out.close();<br>        in.close();<br>      }<br>    }<br> <br>In the above code, if any exception is thrown from the out.close() statement, the in.close() statement will not execute and the input stream will not be closed.</blockquote></li>
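+
+<p>For HADOOP-7194 above, one way to avoid the leak is to close each stream independently so that a failure in one close() does not skip the other. The helper below is a hedged sketch using the existing IOUtils.closeStream(), not necessarily the committed fix:</p>
+<pre>
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.OutputStream;
+import org.apache.hadoop.io.IOUtils;
+
+public class SafeCopy {
+  /** Copy and then close both streams, even if closing the first one fails. */
+  public static void copyAndClose(InputStream in, OutputStream out, int buffSize)
+      throws IOException {
+    try {
+      IOUtils.copyBytes(in, out, buffSize, false); // false: do not close inside copyBytes
+    } finally {
+      IOUtils.closeStream(out); // closeStream() swallows exceptions from close()
+      IOUtils.closeStream(in);
+    }
+  }
+}
+</pre>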
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7193">HADOOP-7193</a>.
+     Minor improvement reported by umamaheswararao and fixed by umamaheswararao (fs)<br>
+     <b>Help message is wrong for touchz command.</b><br>
+     <blockquote>Help message for touchz command is<br> -touchz &lt;path&gt;: Write a timestamp in yyyy-MM-dd HH:mm:ss format<br>                in a file at &lt;path&gt;. An error is returned if the file exists with non-zero length.<br><br>Actually, the current DFS behaviour is that it will not write any timestamp in the created file; it just creates a zero-size file.<br><br>So the help message should be changed to describe the actual behaviour.<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7183">HADOOP-7183</a>.
+     Blocker bug reported by tlipcon and fixed by tomwhite <br>
+     <b>WritableComparator.get should not cache comparator objects</b><br>
+     <blockquote>HADOOP-6881 modified WritableComparator.get such that the constructed WritableComparator gets saved back into the static map. This is fine for stateless comparators, but some comparators have per-instance state, and thus this becomes thread-unsafe and causes errors in the shuffle where multiple threads are doing comparisons. An example of a Comparator with per-instance state is WritableComparator itself.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7177">HADOOP-7177</a>.
+     Trivial improvement reported by aw and fixed by aw (native)<br>
+     <b>CodecPool should report which compressor it is using</b><br>
+     <blockquote>Certain native compression libraries are overly verbose causing confusion while reading the task logs.  Let&apos;s actually say which compressor we got when we report it in the task logs.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7174">HADOOP-7174</a>.
+     Minor bug reported by umamaheswararao and fixed by umamaheswararao (fs)<br>
+     <b>null is displayed in the console,if the src path is invalid while doing copyToLocal operation from commandLine</b><br>
+     <blockquote>When we perform copyToLocal operations from the command line and the src Path is invalid,<br><br>srcFS.globStatus(srcpath) will return null. So, when we take the length of the resulting value, it will throw a NullPointerException.<br><br>Since we are handling a generic exception, it will display null as the message.<br></blockquote></li>
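+
+<p>For HADOOP-7174 above, a minimal sketch of the kind of guard being asked for (illustrative, not the committed change): check the globStatus() result before using it and report the bad source path explicitly:</p>
+<pre>
+import java.io.FileNotFoundException;
+import java.io.IOException;
+import org.apache.hadoop.fs.FileStatus;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
+
+public class GlobGuard {
+  /** Resolve a source pattern, failing with a clear message when it matches nothing. */
+  public static FileStatus[] expandSources(FileSystem srcFs, Path srcPattern)
+      throws IOException {
+    FileStatus[] srcs = srcFs.globStatus(srcPattern);
+    if (srcs == null || srcs.length == 0) {
+      throw new FileNotFoundException("Source pattern " + srcPattern + " matches no files");
+    }
+    return srcs;
+  }
+}
+</pre>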
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7162">HADOOP-7162</a>.
+     Minor bug reported by humanoid and fixed by humanoid (fs)<br>
+     <b>FsShell: call srcFs.listStatus(src) twice</b><br>
+     <blockquote>In file ./src/java/org/apache/hadoop/fs/FsShell.java, line 555, the method is called twice:<br>1. to initialize a variable<br>2. to get the data<br><br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7120">HADOOP-7120</a>.
+     Major bug reported by szetszwo and fixed by szetszwo (test)<br>
+     <b>200 new Findbugs warnings</b><br>
+     <blockquote>ant test-patch on an empty patch over hdfs trunk.<br><br>     [exec] -1 overall.  <br>     [exec] <br>     [exec]     +1 @author.  The patch does not contain any @author tags.<br>     [exec] <br>     [exec]     -1 tests included.  The patch doesn&apos;t appear to include any new or modified tests.<br>     [exec]                         Please justify why no new tests are needed for this patch.<br>     [exec]                         Also please list what manual steps were performed to verify this patch.<br>     [exec] <br>     [exec]     +1 javadoc.  The javadoc tool did not generate any warning messages.<br>     [exec] <br>     [exec]     +1 javac.  The applied patch does not increase the total number of javac compiler warnings.<br>     [exec] <br>     [exec]     -1 findbugs.  The patch appears to introduce 200 new Findbugs (version 1.3.9) warnings.<br>     [exec] <br>     [exec]     -1 release audit.  The applied patch generated 1 release audit warnings (more than the trunk&apos;s current 0 warnings).<br>     [exec] <br>     [exec]     +1 system test framework.  The patch passed system test framework compile.<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7117">HADOOP-7117</a>.
+     Major improvement reported by patrickangeles and fixed by qwertymaniac (conf)<br>
+     <b>Move secondary namenode checkpoint configs from core-default.xml to hdfs-default.xml</b><br>
+     <blockquote>The following configs are in core-default.xml, but are really read by the Secondary Namenode. These should be moved to hdfs-default.xml for consistency.
+     </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7072">HADOOP-7072</a>.
+     Major sub-task reported by cos and fixed by cos (build)<br>
+     <b>Remove java5 dependencies from build</b><br>
+     <blockquote>As the first short-term step let&apos;s remove JDK5 dependency from build(s)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7053">HADOOP-7053</a>.
+     Minor bug reported by yaojingguo and fixed by yaojingguo (conf)<br>
+     <b>wrong FSNamesystem Audit logging setting in conf/log4j.properties</b><br>
+     <blockquote>&quot;log4j.logger.org.apache.hadoop.fs.FSNamesystem.audit=WARN&quot; should be &quot;log4j.logger.org.apache.hadoop.hdfs.server.namenode.FSNamesystem.audit=WARN&quot;.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7052">HADOOP-7052</a>.
+     Major bug reported by yaojingguo and fixed by yaojingguo (conf)<br>
+     <b>misspelling of threshold in conf/log4j.properties</b><br>
+     <blockquote>In &quot;log4j.threshhold=ALL&quot;, threshhold is a misspelling of threshold. So &quot;log4j.threshhold=ALL&quot; has no effect on the control of log4j logging.<br><br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-7019">HADOOP-7019</a>.
+     Major bug reported by owen.omalley and fixed by vicaya (build)<br>
+     <b>Refactor build targets to enable faster cross project dev cycles.</b><br>
+     <blockquote>The current build always generates fault injection artifacts and pushes them to Maven. Most developers have no need for these artifacts and no users need them. </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6993">HADOOP-6993</a>.
+     Major bug reported by atm and fixed by eli (documentation)<br>
+     <b>Broken link on cluster setup page of docs</b><br>
+     <blockquote>The link on http://hadoop.apache.org/common/docs/current/cluster_setup.html#Configuring+the+Hadoop+Daemons to core-default.xml is presently:<br>http://hadoop.apache.org/common/docs/current/common-default.html<br>but it should be:<br>http://hadoop.apache.org/common/docs/current/core-default.html</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6971">HADOOP-6971</a>.
+     Major bug reported by cos and fixed by cos (build, test)<br>
+     <b>Clover build doesn&apos;t generate per-test coverage</b><br>
+     <blockquote>Because of the way the structure of Hadoop&apos;s builds is done Clover can&apos;t properly detect test classes among the sources. As a result, clover reports are incomplete and do not provide vital per-test coverage info.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6969">HADOOP-6969</a>.
+     Major bug reported by shv and fixed by tomwhite <br>
+     <b>CHANGES.txt does not reflect the release of version 0.21.0.</b><br>
+     <blockquote></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6954">HADOOP-6954</a>.
+     Major bug reported by tomwhite and fixed by tomwhite (build)<br>
+     <b>Sources JARs are not correctly published to the Maven repository</b><br>
+     <blockquote>When you try to &quot;close&quot; the staging repository to make it visible to the public the operation fails (see https://issues.apache.org/jira/browse/HDFS-1292?focusedCommentId=12909953&amp;page=com.atlassian.jira.plugin.system.issuetabpanels%3Acomment-tabpanel#action_12909953 for the type of error).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6944">HADOOP-6944</a>.
+     Major task reported by vinaythota and fixed by vinaythota (test)<br>
+     <b>[Herriot] Implement a functionality for getting proxy users definitions like groups and hosts.</b><br>
+     <blockquote>Gridmix needs a proxy users file for impersonating various jobs. So, implement a couple of methods for getting the proxy users list and a proxy users file (a combination of proxy users and groups) based on the cluster configuration.<br><br>The proxy users list is required for map reduce jobs and the proxy users file is required for gridmix jobs.<br><br>The following is the method signature:<br>public ProxyUserDefinitions getHadoopProxyUsers() - gets the list of proxy users based on the cluster configuration.<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6934">HADOOP-6934</a>.
+     Major test reported by oae and fixed by oae (record)<br>
+     <b>test for ByteWritable comparator</b><br>
+     <blockquote>The test for the ByteWritable comparator bug (see HADOOP-6928), which is already fixed in 0.21.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6925">HADOOP-6925</a>.
+     Critical bug reported by tlipcon and fixed by tlipcon (io)<br>
+     <b>BZip2Codec incorrectly implements read()</b><br>
+     <blockquote>HADOOP-4012 added an implementation of read() in BZip2InputStream that doesn&apos;t work correctly when reading bytes &gt; 0x80. This causes EOFExceptions when working with BZip2 compressed data inside of sequence files in some datasets.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6833">HADOOP-6833</a>.
+     Blocker bug reported by tlipcon and fixed by tlipcon <br>
+     <b>IPC leaks call parameters when exceptions thrown</b><br>
+     <blockquote>HADOOP-6498 moved the calls.remove() call lower into the SUCCESS clause of receiveResponse(), but didn&apos;t put a similar calls.remove into the ERROR clause. So, any RPC call that throws an exception ends up orphaning the Call object in the connection&apos;s &quot;calls&quot; hashtable. This prevents cleanup of the connection and is a memory leak for the call parameters.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HADOOP-6786">HADOOP-6786</a>.
+     Major improvement reported by cos and fixed by cos (build)<br>
+     <b>test-patch needs to verify Herriot integrity</b><br>
+     <blockquote>Whenever a new patch is submitted for verification {{test-patch}} process has to make sure that none of Herriot bindings were broken.</blockquote></li>
+
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1750">HDFS-1750</a>.
+     Major bug reported by szetszwo and fixed by szetszwo <br>
+     <b>fs -ls hftp://file not working</b><br>
+     <blockquote><br>hadoop dfs -touchz /tmp/file1 # create file. OK<br>hadoop dfs -ls /tmp/file1  # OK<br>hadoop dfs -ls hftp://namenode:50070/tmp/file1 # FAILED: not seeing the file<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1728">HDFS-1728</a>.
+     Minor bug reported by szetszwo and fixed by szetszwo (name-node)<br>
+     <b>SecondaryNameNode.checkpointSize is in byte but not MB.</b><br>
+     <blockquote>The unit of SecondaryNameNode.checkpointSize is byte but not MB as stated in the following comment.<br><br>//SecondaryNameNode.java<br>   private long checkpointSize;    // size (in MB) of current Edit Log<br><br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1665">HDFS-1665</a>.
+     Minor bug reported by szetszwo and fixed by szetszwo (balancer)<br>
+     <b>Balancer sleeps inadequately</b><br>
+     <blockquote>The value of {{dfs.heartbeat.interval}} is in seconds. Balancer seems to have misused it.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1612">HDFS-1612</a>.
+     Minor bug reported by joecrobak and fixed by joecrobak (documentation)<br>
+     <b>HDFS Design Documentation is outdated</b><br>
+     <blockquote>I was trying to discover details about the Secondary NameNode, and came across the description below in the HDFS design doc.<br><br><br>The NameNode keeps an image of the entire file system namespace and file Blockmap in memory. This key metadata item is designed to be compact, such that a NameNode with 4 GB of RAM is plenty to support a huge number of files and directories. When the NameNode starts up, it reads the FsImage and EditLog from disk, applies all the transactions from the EditLog to the in-memory representation of the FsImage, and flushes out this new version into a new FsImage on disk. It can then truncate the old EditLog because its transactions have been applied to the persistent FsImage. This process is called a checkpoint. *In the current implementation, a checkpoint only occurs when the NameNode starts up. Work is in progress to support periodic checkpointing in the near future.*<br><br>(emphasis mine).<br><br>Note that this directly conflicts with information in the hdfs user guide, http://hadoop.apache.org/common/docs/r0.20.2/hdfs_user_guide.html#Secondary+NameNode<br>and http://hadoop.apache.org/hdfs/docs/current/hdfs_user_guide.html#Checkpoint+Node<br><br>I haven&apos;t done a thorough audit of that doc-- I only noticed the above inaccuracy.<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1598">HDFS-1598</a>.
+     Major bug reported by szetszwo and fixed by szetszwo (name-node)<br>
+     <b>ListPathsServlet excludes .*.crc files</b><br>
+     <blockquote>The {{.*.crc}} files are excluded by default.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1596">HDFS-1596</a>.
+     Major improvement reported by patrickangeles and fixed by qwertymaniac (documentation, name-node)<br>
+     <b>Move secondary namenode checkpoint configs from core-default.xml to hdfs-default.xml</b><br>
+     <blockquote>The following configs are in core-default.xml, but are really read by the Secondary Namenode. These should be moved to hdfs-default.xml for consistency.
+     </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1552">HDFS-1552</a>.
+     Major bug reported by cos and fixed by cos (build)<br>
+     <b>Remove java5 dependencies from build</b><br>
+     <blockquote>As the first short-term step let&apos;s remove JDK5 dependency from build(s)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1548">HDFS-1548</a>.
+     Major bug reported by cos and fixed by cos (build, test)<br>
+     <b>Fault-injection tests are executed multiple times if invoked with run-test-hdfs-fault-inject target</b><br>
+     <blockquote>When invoked with {{run-test-hdfs-fault-inject target}} fault injection tests are getting executed 4 times.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1474">HDFS-1474</a>.
+     Major bug reported by cos and fixed by cos (build)<br>
+     <b>ant binary-system is broken</b><br>
+     <blockquote>The build failed because it was unable to copy the commons instrumented jar. I could see the following error in the log.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1452">HDFS-1452</a>.
+     Major bug reported by jghoman and fixed by cos (contrib/hdfsproxy)<br>
+     <b>ant compile-contrib is broken</b><br>
+     <blockquote>ant compile-contrib is broken, looks like commit a0a62d971fb35de7f021ecbd6ceb8d08ef923ed5 HDFS-1444<br></blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1444">HDFS-1444</a>.
+     Minor bug reported by cos and fixed by cos (build)<br>
+     <b>Test related code of build.xml is error-prone and needs to be re-aligned.</b><br>
+     <blockquote>Test related parts of build.xml introduce at least two (effectively different) destinations for compiling test classes.<br>Then some extra logic is applied at, say, the test-jar creation step, where the content of one is copied over to the other, etc.<br><br>This seems overcomplicated and should be fixed to prevent possible issues with future build modifications.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1420">HDFS-1420</a>.
+     Major bug reported by cos and fixed by cos (build, test)<br>
+     <b>Clover build doesn&apos;t generate per-test coverage</b><br>
+     <blockquote>Because of the way the structure of Hadoop&apos;s builds is done Clover can&apos;t properly detect test classes among the sources. As a result, clover reports are incomplete and do not provide vital per-test coverage info.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1416">HDFS-1416</a>.
+     Major bug reported by shv and fixed by tomwhite <br>
+     <b>CHANGES.txt does not reflect the release version 0.21.0.</b><br>
+     <blockquote>CHANGES.txt still claims version 0.21.0 - Unreleased. It should show the release date instead and include a section for 0.21.1 - Unreleased. The latest changes that did not make it into 0.21.0 should be moved under the 0.21.1 section.<br>This should also be fixed for common and mapreduce.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1413">HDFS-1413</a>.
+     Major bug reported by shv and fixed by shv (documentation)<br>
+     <b>Broken links to HDFS Wiki in hdfs site and documentation.</b><br>
+     <blockquote># hdfs/site wiki tab points to &quot;http://wiki.apache.org/hadoop/DFS&quot;, should be HDFS.<br># hdfs documentation wiki tab points to &quot;http://wiki.apache.org/hadoop/hdfs&quot;, should be HDFS.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1411">HDFS-1411</a>.
+     Minor bug reported by chingshen and fixed by chingshen (documentation)<br>
+     <b>The startup command of the Backup Node is &quot;bin/hdfs namenode -backup&quot;</b><br>
+     <blockquote>The startup command of the Backup Node is &quot;bin/hdfs namenode -backup&quot;</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1377">HDFS-1377</a>.
+     Blocker bug reported by eli and fixed by eli (name-node)<br>
+     <b>Quota bug for partial blocks allows quotas to be violated </b><br>
+     <blockquote>There&apos;s a bug in the quota code that causes them not to be respected when a file is not an exact multiple of the block size.
+     </blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1363">HDFS-1363</a>.
+     Major bug reported by shv and fixed by shv <br>
+     <b>startFileInternal should return the last block of the file opened for append as an under-construction block</b><br>
+     <blockquote>{{FSNamesystem.startFileInternal}} should convert the last block of the file opened for append to an under-construction block and return it. This will let remove the second synchronized section in {{FSNamesystem.appendFile()}} and avoid redundant computations and potential inconsistencies as stated in HDFS-1152.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1343">HDFS-1343</a>.
+     Minor improvement reported by cos and fixed by cos (build)<br>
+     <b>Instrumented build should be concentrated in one build area</b><br>
+     <blockquote>The current instrumented build is inefficient in the sense that part of it is built under build-fi and another part under build-fi/system.<br>This doubles the compilation time of some classes and tests and needs to be fixed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1206">HDFS-1206</a>.
+     Major bug reported by szetszwo and fixed by cos (test)<br>
+     <b>TestFiHFlush fails intermittently</b><br>
+     <blockquote>When I was testing HDFS-1114, the patch passed all tests except TestFiHFlush. Then I tried to print out some debug messages; however, TestFiHFlush succeeded after the messages were added.<br><br>TestFiHFlush probably depends on the speed of BlocksMap. If BlocksMap is slow enough, the test will pass.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-1189">HDFS-1189</a>.
+     Major bug reported by xiaokang and fixed by johnvijoe (name-node)<br>
+     <b>Quota counts missed between clear quota and set quota</b><br>
+     <blockquote>HDFS quota counts can be missed between a clear-quota operation and a subsequent set-quota.<br><br>When setting a quota for a dir, the INodeDirectory is replaced by INodeDirectoryWithQuota and dir.isQuotaSet() becomes true. When INodeDirectoryWithQuota is newly created, quota counting is performed. However, when clearing the quota, the quota conf is set to -1 and dir.isQuotaSet() becomes false, while INodeDirectoryWithQuota is NOT replaced back by INodeDirectory.<br><br>FSDirectory.updateCount only updates the quota count for inodes whose isQuotaSet() is true. So after clearing the quota for a dir, its quota counts are not updated, which is reasonable. But when re-setting a quota for this dir, quota counting is not performed again and some counts are missed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/HDFS-996">HDFS-996</a>.
+     Blocker bug reported by cos and fixed by cos (test)<br>
+     <b>JUnit tests should never depend on anything in conf</b><br>
+     <blockquote>Similar to MAPREDUCE-1369 we need to make sure that nothing in conf is used in the unit tests. </blockquote></li>
+
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2317">MAPREDUCE-2317</a>.
+     Minor bug reported by devaraj.k and fixed by devaraj.k (harchive)<br>
+     <b>HadoopArchives throwing NullPointerException while creating hadoop archives (.har files)</b><br>
+     <blockquote>When running the hadoop archive tool on Windows as follows,<br>java org.apache.hadoop.tools.HadoopArchives -archiveName temp.har D:/test/in E:/temp<br>it throws a java.lang.NullPointerException.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2228">MAPREDUCE-2228</a>.
+     Major bug reported by cos and fixed by cos (build)<br>
+     <b>Remove java5 dependencies from build</b><br>
+     <blockquote>As the first short-term step, let&apos;s remove the JDK5 dependency from the build(s).</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2223">MAPREDUCE-2223</a>.
+     Minor bug reported by cos and fixed by cos (test)<br>
+     <b>TestMRCLI might fail on Ubuntu with default /etc/hosts</b><br>
+     <blockquote>Depending on the order of entries in /etc/hosts, TestCLI can fail. This is because it sets fs.default.name to &quot;localhost&quot;, and then the bound IPC socket on the NN side reports its hostname as &quot;foobar-host&quot; if the entry for 127.0.0.1 lists &quot;foobar-host&quot; before &quot;localhost&quot;. This seems to be the default in some versions of Ubuntu.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2140">MAPREDUCE-2140</a>.
+     Trivial improvement reported by matei and fixed by matei <br>
+     <b>Re-generate fair scheduler design doc PDF</b><br>
+     <blockquote>The Fair Scheduler contains a design document in src/contrib/fairscheduler/designdoc that is included both as a Latex file and as a PDF. However, the PDF that&apos;s currently there is not generated properly and has some question marks for section references. I&apos;d like to regenerate it and commit the new one. There is no patch to attach because this just requires running pdflatex and committing a binary file.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2134">MAPREDUCE-2134</a>.
+     Major bug reported by vinaythota and fixed by cos (build)<br>
+     <b>ant binary-system is broken in mapreduce project.</b><br>
+     <blockquote>The build failed because it was unable to copy the commons instrumented jar.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2090">MAPREDUCE-2090</a>.
+     Major bug reported by cos and fixed by cos (build, test)<br>
+     <b>Clover build doesn&apos;t generate per-test coverage</b><br>
+     <blockquote>Because of the way Hadoop&apos;s builds are structured, Clover can&apos;t properly detect test classes among the sources. As a result, Clover reports are incomplete and do not provide per-test coverage information.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2086">MAPREDUCE-2086</a>.
+     Major bug reported by shv and fixed by tomwhite <br>
+     <b>CHANGES.txt does not reflect the release of version 0.21.0.</b><br>
+     <blockquote>CHANGES.txt should show the release date for 0.21.0 and include a section for 0.21.1 - Unreleased. The latest changes that did not make it into 0.21.0 should be moved under the 0.21.1 section.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2040">MAPREDUCE-2040</a>.
+     Minor new feature reported by sandholm and fixed by sandholm (contrib/dynamic-scheduler)<br>
+     <b>Forrest Documentation for Dynamic Priority Scheduler</b><br>
+     <blockquote>New Forrest documentation for dynamic priority scheduler</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-2032">MAPREDUCE-2032</a>.
+     Major bug reported by amareshwari and fixed by dking (task)<br>
+     <b>TestJobOutputCommitter fails in ant test run</b><br>
+     <blockquote>TestJobOutputCommitter fails in an &quot;ant test&quot; run with the following exception:<br><br>Output directory /home/amarsri/mapred/build/test/data/test-job-cleanup/output-2 already exists<br>org.apache.hadoop.fs.FileAlreadyExistsException: Output directory /home/amarsri/mapred/build/test/data/test-job-cleanup/output-2 already exists<br>        at org.apache.hadoop.mapreduce.lib.output.FileOutputFormat.checkOutputSpecs(FileOutputFormat.java:141)<br>        at org.apache.hadoop.mapreduce.JobSubmitter.checkSpecs(JobSubmitter.java:391)<br>        at org.apache.hadoop.mapreduce.JobSubmitter.submitJobInternal(JobSubmitter.java:350)<br>        at org.apache.hadoop.mapreduce.Job$2.run(Job.java:1037)<br>        at org.apache.hadoop.mapreduce.Job$2.run(Job.java:1034)<br>        at java.security.AccessController.doPrivileged(Native Method)<br>        at javax.security.auth.Subject.doAs(Subject.java:396)<br>        at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1093)<br>        at org.apache.hadoop.mapreduce.Job.submit(Job.java:1034)<br>        at org.apache.hadoop.mapreduce.lib.output.TestJobOutputCommitter.testKilledJob(TestJobOutputCommitter.java:192)<br>        at org.apache.hadoop.mapreduce.lib.output.TestJobOutputCommitter.testDefaultCleanupAndAbort(TestJobOutputCommitter.java:232)<br><br>But it passes when run individually.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1984">MAPREDUCE-1984</a>.
+     Major bug reported by balajirg and fixed by balajirg <br>
+     <b>herriot TestCluster fails because exclusion is not there</b><br>
+     <blockquote>Restart is part of the test case, which causes IOExceptions that need to be ignored; the test case should not be incorrectly failed.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1929">MAPREDUCE-1929</a>.
+     Blocker bug reported by tomwhite and fixed by tomwhite (build)<br>
+     <b>Allow artifacts to be published to the staging Apache Nexus Maven Repository</b><br>
+     <blockquote>MapReduce companion issue to HADOOP-6847.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1905">MAPREDUCE-1905</a>.
+     Blocker bug reported by amareshwari and fixed by amareshwari (task)<br>
+     <b>Context.setStatus() and progress() api are ignored</b><br>
+     <blockquote>TaskAttemptContext.setStatus() and progress() were overridden in TaskInputOutputContext, in branch 0.20, to call the underlying reporter APIs. But the methods are no longer overridden in TaskInputOutputContextImpl after MAPREDUCE-954. (A brief usage sketch follows the issue list below.)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1897">MAPREDUCE-1897</a>.
+     Major bug reported by roelofs and fixed by cos (test)<br>
+     <b>trunk build broken on compile-mapred-test</b><br>
+     <blockquote>...apparently.  Fresh checkout of trunk (all three hadoop-*), build.properties project.version fix, ant veryclean mvn-install of common, hdfs, and then mapreduce:</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1809">MAPREDUCE-1809</a>.
+     Major task reported by vinaythota and fixed by vinaythota (build)<br>
+     <b>Ant build changes for Streaming system tests in contrib projects.</b><br>
+     <blockquote>Implementing a new target (test-system) in the build-contrib.xml file for executing the system tests that are in contrib projects. Also adding a &apos;subant&apos; target in aop.xml that calls the build-contrib.xml file for system tests.</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1501">MAPREDUCE-1501</a>.
+     Major improvement reported by zshao and fixed by zshao <br>
+     <b>FileInputFormat to support multi-level/recursive directory listing</b><br>
+     <blockquote>As we have seen multiple times on the mailing list, users want the capability of getting all files out of a multi-level directory structure.<br>One solution our users had was to write a new FileInputFormat, but that would mean changing all existing FileInputFormat subclasses to support this feature.<br>We can easily provide a JobConf option (which defaults to false) to {{FileInputFormat.listStatus(...)}} to recurse into the directory structure. (See the sketch after this list.)</blockquote></li>
+
+<li> <a href="https://issues.apache.org/jira/browse/MAPREDUCE-1280">MAPREDUCE-1280</a>.
+     Major bug reported by kimballa and fixed by alexvk <br>
+     <b>Eclipse Plugin does not work with Eclipse Ganymede (3.4)</b><br>
+     <blockquote>The newest version of Eclipse seems incompatible with the plugin. The plugin as released in 0.16.4 will allow you to add/remove MapReduce servers, and will allow you to browse/manipulate the DFS in the DFS Browser, but will not allow you to run programs. Clicking &quot;Run As * Run On Hadoop&quot; will simply not cause the run-on-hadoop server selection window to appear. No error message is given.<br><br>Dropping the 0.17.1 copy of the plugin JAR into the eclipse/plugins/ directory does not fix the issue; it is in fact worse: Eclipse does not seem to regard the 0.17 plugin as real. No &quot;MapReduce Perspective&quot; is made available in the perspectives selection window.</blockquote></li>
+
+</ul>
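+<p>As a rough illustration of the two job-level API items above (MAPREDUCE-1501, recursive input listing, and MAPREDUCE-1905, the restored Context.setStatus()/progress() calls), the following is a minimal, hypothetical sketch rather than shipped Hadoop code. The property name &quot;mapred.input.dir.recursive&quot; and the example class names are assumptions based on the issue summaries above.</p>
+
+<pre>
+// Hypothetical sketch only: exercises the recursive-input flag discussed in
+// MAPREDUCE-1501 and the Context.setStatus()/progress() calls restored by
+// MAPREDUCE-1905. The property name and class names are assumptions.
+import java.io.IOException;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.Path;
+import org.apache.hadoop.io.LongWritable;
+import org.apache.hadoop.io.NullWritable;
+import org.apache.hadoop.io.Text;
+import org.apache.hadoop.mapreduce.Job;
+import org.apache.hadoop.mapreduce.Mapper;
+import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
+import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
+
+public class RecursiveInputExample {
+
+  public static class PassThroughMapper
+      extends Mapper&lt;LongWritable, Text, Text, NullWritable&gt; {
+    @Override
+    protected void map(LongWritable key, Text value, Context context)
+        throws IOException, InterruptedException {
+      // MAPREDUCE-1905: these calls are forwarded to the underlying task reporter.
+      context.setStatus("processing offset " + key.get());
+      context.progress();
+      context.write(value, NullWritable.get());
+    }
+  }
+
+  public static void main(String[] args) throws Exception {
+    Configuration conf = new Configuration();
+    // MAPREDUCE-1501: assumed property name for recursive directory listing.
+    conf.setBoolean("mapred.input.dir.recursive", true);
+    Job job = new Job(conf, "recursive-input-example");
+    job.setJarByClass(RecursiveInputExample.class);
+    job.setMapperClass(PassThroughMapper.class);
+    job.setNumReduceTasks(0);
+    job.setOutputKeyClass(Text.class);
+    job.setOutputValueClass(NullWritable.class);
+    FileInputFormat.addInputPath(job, new Path(args[0]));
+    FileOutputFormat.setOutputPath(job, new Path(args[1]));
+    System.exit(job.waitForCompletion(true) ? 0 : 1);
+  }
+}
+</pre>
+
+<p>With the flag enabled, FileInputFormat.listStatus() is expected to descend into sub-directories of each input path rather than treating them as errors; the exact behavior should be confirmed against the committed patch.</p>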
+
+</body>
+</html>

+ 13 - 1
hdfs/CHANGES.txt

@@ -1,6 +1,18 @@
 Hadoop HDFS Change Log
 
-Release 0.22.0 - Unreleased
+Release 0.22.1 - Unreleased
+
+  INCOMPATIBLE CHANGES
+
+  NEW FEATURES
+
+  IMPROVEMENTS
+
+  OPTIMIZATIONS
+
+  BUG FIXES
+
+Release 0.22.0 - 2011-11-29
 
   INCOMPATIBLE CHANGES
 

+ 1 - 1
hdfs/build.xml

@@ -30,7 +30,7 @@
   <property name="name" value="hadoop-hdfs"/>
   <!-- Need to change aop.xml project.version prop. synchronously
    -->
-  <property name="version" value="0.22.0-SNAPSHOT"/>
+  <property name="version" value="0.22.0"/>
   <property name="final.name" value="${name}-${version}"/>
   <property name="test.hdfs.final.name" value="${name}-test-${version}"/>
   <property name="ant.final.name" value="${name}-ant-${version}"/>

+ 13 - 1
mapreduce/CHANGES.txt

@@ -1,6 +1,18 @@
 Hadoop MapReduce Change Log
 
-Release 0.22.0 - Unreleased
+Release 0.22.1 - Unreleased
+
+  INCOMPATIBLE CHANGES
+
+  NEW FEATURES
+
+  IMPROVEMENTS
+
+  OPTIMIZATIONS
+
+  BUG FIXES
+
+Release 0.22.0 - 2011-11-29
 
   INCOMPATIBLE CHANGES
 

+ 1 - 1
mapreduce/build.xml

@@ -31,7 +31,7 @@
   <property name="Name" value="Hadoop-Mapred"/>
   <property name="name" value="hadoop-mapred"/>
   <!-- Need to change aop.xml project.version prop. synchronously -->
-  <property name="version" value="0.22.0-SNAPSHOT"/>
+  <property name="version" value="0.22.0"/>
   <property name="final.name" value="${name}-${version}"/>
   <property name="test.final.name" value="${name}-test-${version}"/>
   <property name="examples.final.name" value="${name}-examples-${version}"/>