CHANGES.txt 93 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489
  1. Hadoop MapReduce Change Log
  2. Trunk (unreleased changes)
  3. INCOMPATIBLE CHANGES
  4. MAPREDUCE-2455. Remove deprecated JobTracker.State in favour of
  5. JobTrackerStatus. (tomwhite)
  6. MAPREDUCE-2430. Remove mrunit contrib. (nigel via eli)
  7. MAPREDUCE-2606. Remove IsolationRunner. (Alejandro Abdelnur via eli)
  8. NEW FEATURES
  9. MAPREDUCE-2682. Add "mapred classpath" command to print classpath
  10. for MR applications. (vinodkv via acmurthy)
  11. MAPREDUCE-2107. [Gridmix] Total heap usage emulation in Gridmix.
  12. (Amar Kamat and Ravi Gummadi via amarrk)
  13. MAPREDUCE-2106. [Gridmix] Cumulative CPU usage emulation in Gridmix.
  14. (amarrk)
  15. MAPREDUCE-2543. [Gridmix] High-Ram feature emulation in Gridmix. (amarrk)
  16. MAPREDUCE-2408. [Gridmix] Compression emulation in Gridmix. (amarrk)
  17. MAPREDUCE-2473. Add "mapred groups" command to query the server-side groups
  18. resolved for a user. (Aaron T. Myers via todd)
  19. MAPREDUCE-461. Enable ServicePlugins for the JobTracker.
  20. (Fredrik Hedberg via tomwhite)
  21. MAPREDUCE-2521. Create RPM and Debian packages for MapReduce. Changes
  22. deployment layout to be consistent across the binary tgz, rpm, and deb.
  23. (Eric Yang via omalley)
  24. MAPREDUCE-2323. Add metrics to the fair scheduler. (todd)
  25. IMPROVEMENTS
  26. MAPREDUCE-2365. Add counters to track bytes (read,written) via
  27. File(Input,Output)Format. (Siddharth Seth via acmurthy)
  28. MAPREDUCE-2680. Display queue name in job client CLI. (acmurthy)
  29. MAPREDUCE-2679. Minor changes to sync trunk with MR-279 branch. (acmurthy)
  30. MAPREDUCE-2400. Remove Cluster's dependency on JobTracker via a
  31. ServiceProvider for the actual implementation. (tomwhite via acmurthy)
  32. MAPREDUCE-2596. [Gridmix] Summarize Gridmix runs. (amarrk)
  33. MAPREDUCE-2563. [Gridmix] Add High-Ram emulation system tests to
  34. Gridmix. (Vinay Kumar Thota via amarrk)
  35. MAPREDUCE-2104. [Rumen] Add Cpu, Memory and Heap usages to
  36. TraceBuilder's output. (amarrk)
  37. MAPREDUCE-2554. [Gridmix] Add distributed cache emulation system tests
  38. to Gridmix. (Vinay Kumar Thota via amarrk)
  39. MAPREDUCE-2543. [Gridmix] High-Ram feature emulation testcase. (amarrk)
  40. MAPREDUCE-2469. Task counters should also report the total heap usage of
  41. the task. (Ravi Gummadi and Amar Ramesh Kamat via amarrk)
  42. MAPREDUCE-2544. [Gridmix] Add compression emulation system tests to
  43. Gridmix. (Vinay Kumar Thota via amarrk)
  44. MAPREDUCE-2517. [Gridmix] Add system tests to Gridmix.
  45. (Vinay Kumar Thota via amarrk)
  46. MAPREDUCE-2492. The new MapReduce API should make available task's
  47. progress to the task. (amarrk)
  48. MAPREDUCE-2153. Bring more job configuration properties into the trace
  49. file. (Rajesh Balamohan via amarrk)
  50. MAPREDUCE-1461. Feature to instruct rumen-folder utility to skip jobs worth
  51. of specific duration. (Rajesh Balamohan via amarrk)
  52. MAPREDUCE-2172. Added test-patch.properties required by test-patch.sh
  53. (nigel)
  54. MAPREDUCE-2156. Raid-aware FSCK. (Patrick Kling via dhruba)
  55. MAPREDUCE-2215. A more elegant FileSystem#listCorruptFileBlocks API
  56. (RAID changes) (Patrick Kling via hairong)
  57. MAPREDUCE-1831. BlockPlacement policy for HDFS-RAID.
  58. (Scott Chen via dhruba)
  59. MAPREDUCE-1906. Lower minimum heartbeat interval for TaskTracker
  60. (Scott Carey and Todd Lipcon via todd)
  61. MAPREDUCE-1382. MRAsyncDiscService should tolerate missing local.dir.
  62. (Zheng Shao and tomwhite via tomwhite)
  63. MAPREDUCE-2263. MapReduce side of HADOOP-6904: RPC compatibility.
  64. (hairong)
  65. MAPREDUCE-1706. Log RAID recoveries on HDFS. (schen)
  66. MAPREDUCE-2334. Update BlockPlacementPolicyRaid for the new method
  67. in BlockPlacementPolicy. (szetszwo)
  68. MAPREDUCE-2254. Allow setting of end-of-record delimiter for
  69. TextInputFormat (Ahmed Radwan via todd)
  70. MAPREDUCE-1927. Unit test for HADOOP-6835 (concatenated gzip support).
  71. (Greg Roelofs via tomwhite)
  72. MAPREDUCE-2206. The task-cleanup tasks should be optional. (schen)
  73. MAPREDUCE-2225. MultipleOutputs should not require the use of 'Writable'.
  74. (Harsh J Chouraria via tomwhite)
  75. MAPREDUCE-1811. Job.monitorAndPrintJob() should print status of the job
  76. at completion. (Harsh J Chouraria via tomwhite)
  77. MAPREDUCE-993. bin/hadoop job -events <jobid> <from-event-#> <#-of-events>
  78. help message is confusing. (Harsh J Chouraria via tomwhite)
  79. MAPREDUCE-2302. Add static factory methods in GaloisField. (schen)
  80. MAPREDUCE-2351. mapred.job.tracker.history.completed.location should
  81. support an arbitrary filesystem URI. (tomwhite)
  82. MAPREDUCE-2239. BlockPlacementPolicyRaid should call getBlockLocations
  83. only when necessary. (schen)
  84. MAPREDUCE-2331. Add coverage of task graph servlet to fair scheduler system
  85. test. (todd)
  86. MAPREDUCE-2367. Allow using a file to exclude certain tests from build.
  87. (todd)
  88. MAPREDUCE-2202. Generalize CLITest structure and interfaces to facilitate
  89. upstream adoption (e.g. for web or system testing). (cos)
  90. MAPREDUCE-2420. JobTracker should be able to renew delegation token over
  91. HTTP (Boris Shkolnik via jitendra)
  92. MAPREDUCE-2474. Add docs to the new API Partitioner on how to access the
  93. Job Configuration. (Harsh J Chouraria via todd)
  94. MAPREDUCE-2475. Disable IPv6 for junit tests. (suresh srinivas via mahadev)
  95. MAPREDUCE-2422. Removed unused internal methods from DistributedCache.
  96. (tomwhite)
  97. MAPREDUCE-2456. Log the reduce taskID and associated TaskTrackers with
  98. failed fetch notifications in the JobTracker log.
  99. (Jeffrey Naisbitt via cdouglas)
  100. MAPREDUCE-869. Documentation for config to set map/reduce task environment
  101. (Alejandro Abdelnur via todd)
  102. MAPREDUCE-2410. Add entry to streaming FAQ about how streaming reducers
  103. receive keys. (Harsh J Chouraria via todd)
  104. MAPREDUCE-2499. MR part of HADOOP-7291. (eli)
  105. MAPREDUCE-2497. Missing spaces in error messages. (eli)
  106. MAPREDUCE-2502. JobSubmitter should use mapreduce.job.maps instead of
  107. its deprecated equivalent. (eli via todd)
  108. MAPREDUCE-2381. JobTracker instrumentation not consistent about error
  109. handling. (Philip Zeyliger via tomwhite)
  110. MAPREDUCE-2449. Allow for command line arguments when performing
  111. "Run on Hadoop" action in Eclipse plugin. (Jeff Zemerick via todd)
  112. MAPREDUCE-2483. Remove duplication of jars between Hadoop subprojects
  113. from build artifacts. (Eric Yang via omalley)
  114. MAPREDUCE-2372. TaskLogAppender mechanism shouldn't be set up in
  115. log4j.properties (todd)
  116. MAPREDUCE-2516. Rename webinterface.private.actions to
  117. mapreduce.jobtracker.webinterface.trusted (Ari Rabkin via todd)
  118. MAPREDUCE-2459. Cache HAR filesystem metadata. (Mac Yang via mahadev)
  119. HADOOP-7259. Contrib modules should include the build.properties from
  120. the enclosing hadoop directory. (omalley)
  121. MAPREDUCE-2494. Order distributed cache deletions by LRU. (Robert Joseph
  122. Evans via cdouglas)
  123. MAPREDUCE-2452. Makes the cancellation of delegation tokens happen in a
  124. separate thread. (ddas)
  125. HADOOP-7106. Reorganize project SVN layout to "unsplit" the projects.
  126. (todd, nigel)
  127. MAPREDUCE-2249. Check the reflexive property of Counters objects when
  128. comparing equality. (Devaraj K via todd)
  129. MAPREDUCE-2623. Update ClusterMapReduceTestCase to use
  130. MiniDFSCluster.Builder (Harsh J Chouraria via eli)
  131. MAPREDUCE-2602. Allow setting of end-of-record delimiter for
  132. TextInputFormat for the old API. (Ahmed Radwan via todd)
  133. OPTIMIZATIONS
  134. MAPREDUCE-2026. Make JobTracker.getJobCounters() and
  135. JobInProgress.getCounters() acquire locks in a shorter time period.
  136. (Joydeep Sen Sarma via schen)
  137. MAPREDUCE-2740. MultipleOutputs in new API creates needless
  138. TaskAttemptContexts. (todd)
  139. BUG FIXES
  140. MAPREDUCE-2603. Disable High-Ram emulation in system tests.
  141. (Vinay Kumar Thota via amarrk)
  142. MAPREDUCE-2539. Fixed NPE in getMapTaskReports in JobClient. (Robert Evans via
  143. acmurthy)
  144. MAPREDUCE-2531. Fixed jobcontrol to downgrade JobID. (Robert Evans via
  145. acmurthy)
  146. MAPREDUCE-1978. Rumen TraceBuilder should provide recursive
  147. input folder scanning.
  148. MAPREDUCE-2416. Remove the restriction of specifying group names in
  149. users-list file for Gridmix in RoundRobinUserResolver mode.
  150. MAPREDUCE-2417. Fix Gridmix in RoundRobinUserResolver mode to
  151. map testing/proxy users to unique users in a trace.
  152. MAPREDUCE-2307. Exception thrown in Jobtracker logs, when the Scheduler
  153. configured is FairScheduler. (Devaraj K via matei)
  154. MAPREDUCE-2199. build is broken 0.22 branch creation. (cos)
  155. MAPREDUCE-1752. Implement getFileBlockLocations in HarFilesystem.
  156. (Patrick Kling via dhruba)
  157. MAPREDUCE-2155. RaidNode should optionally use the mapreduce jobs to
  158. fix missing blocks. (Patrick Kling via dhruba)
  159. MAPREDUCE-1334. Fix TestIndexUpdater by ignoring _SUCCESS file in HDFS.
  160. (Kay Kay via yhemanth)
  161. MAPREDUCE-2232. Add missing methods to TestMapredGroupMappingServiceRefresh.
  162. (Todd Lipcon via eli)
  163. MAPREDUCE-2271. Fix TestSetupTaskScheduling failure on trunk.
  164. (Liyin Liang via todd)
  165. MAPREDUCE-2290. Fix compilation error in TestTaskCommit. (eli)
  166. MAPREDUCE-2294. Fix compilation error in mumak. (todd)
  167. MAPREDUCE-2300. Fix TestUmbilicalProtocolWithJobToken on trunk after
  168. HADOOP-6904. (todd)
  169. MAPREDUCE-2296. Fix references to misspelled method name
  170. getProtocolSigature (todd)
  171. MAPREDUCE-2311. Fix TestFairScheduler failure (schen)
  172. MAPREDUCE-1996. API: Reducer.reduce() method detail misstatement.
  173. (Harsh J Chouraria via tomwhite)
  174. MAPREDUCE-2203. Wrong javadoc for TaskRunner's appendJobJarClasspaths
  175. method. (Jingguo Yao via tomwhite)
  176. MAPREDUCE-2074. Task should fail when symlink creation fails.
  177. (Priyo Mustafi via tomwhite)
  178. MAPREDUCE-1242. Chain APIs error misleading.
  179. (Harsh J Chouraria via tomwhite)
  180. MAPREDUCE-2379. Adds missing DistributedCache configurations in
  181. mapred-default.xml (Todd Lipcon via amareshwari)
  182. MAPREDUCE-2348. Disable mumak tests on trunk since they currently time out
  183. (todd)
  184. MAPREDUCE-2395. TestBlockFixer timing out on trunk. (Ramkumar Vadali via
  185. todd)
  186. MAPREDUCE-2426. Make TestFairSchedulerSystem fail with more verbose output
  187. (todd)
  188. MAPREDUCE-2448. NoSuchMethodError:
  189. org.apache.hadoop.hdfs.TestDatanodeBlockScanner.corruptReplica(..) (eli)
  190. MAPREDUCE-2460. Fix flaky test TestFairSchedulerSystem. (todd)
  191. MAPREDUCE-2451. Log the details from health check script at the
  192. JobTracker. (Thomas Graves via cdouglas)
  193. MAPREDUCE-2467. HDFS-1052 changes break the raid contrib module in
  194. MapReduce. (suresh srinivas via mahadev)
  195. MAPREDUCE-2258. IFile reader closes stream and compressor in wrong order.
  196. (todd via tomwhite)
  197. MAPREDUCE-2518. The t flag is missing in distcp help message. (Wei Yongjun
  198. via szetszwo)
  199. MAPREDUCE-2514. Fix typo in TaskTracker ReinitTrackerAction log message.
  200. (Jonathan Eagles via cdouglas)
  201. MAPREDUCE-2490. Add logging to graylist and blacklist activity to aid
  202. diagnosis of related issues. (Jonathan Eagles via cdouglas)
  203. MAPREDUCE-2495. exit() the TaskTracker when the distributed cache cleanup
  204. thread dies. (Robert Joseph Evans via cdouglas)
  205. MAPREDUCE-2470. Fix NPE in RunningJobs::getCounters. (Robert Joseph Evans
  206. via cdouglas)
  207. MAPREDUCE-2536. Update FsShell -mv command usage in TestMRCLI. (Daryn
  208. Sharp via szetszwo)
  209. MAPREDUCE-2529. Add support for regex-based shuffle metric counting
  210. exceptions. (Thomas Graves via cdouglas)
  211. MAPREDUCE-2559. ant binary fails due to missing c++ lib dir. (eli)
  212. MAPREDUCE-2573. Fix new findbugs warning introduced by MAPREDUCE-2494.
  213. (Robert Joseph Evans via todd)
  214. MAPREDUCE-2581. Spelling errors in log messages. (Tim Sell via eli)
  215. MAPREDUCE-2588. Change raid to the new DataTransferProtocol API. (szetszwo)
  216. MAPREDUCE-2576. Typo in comment in SimulatorLaunchTaskAction.java.
  217. (Tim Sell via jghoman)
  218. MAPREDUCE-2550. Fix bin/mapred to work properly from within a source
  219. checkout (Eric Yang via todd)
  220. MAPREDUCE-2620. Update RAID for HDFS-2087. (szetszwo)
  221. MAPREDUCE-2624. Update RAID for HDFS-2107. (szetszwo)
  222. MAPREDUCE-2670. Fixing spelling mistake in FairSchedulerServlet.java. (eli)
  223. MAPREDUCE-2710. Update JobSubmitter.printTokens(..) for HDFS-2161.
  224. (szetszwo)
  225. MAPREDUCE-2409. DistributedCache maps files and archives to the same path,
  226. despite semantic incompatibility. (Siddharth Seth via cdouglas)
  227. MAPREDUCE-2575. TestMiniMRDFSCaching fails if test.build.dir is set
  228. to something other than build/test (Thomas Graves via mahadev)
  229. MAPREDUCE-2622. Remove the last remaining reference to the deprecated
  230. configuration "io.sort.mb". (Harsh J Chouraria via todd)
  231. MAPREDUCE-2732. Remove directly accessing FSNamesystem.LOG from
  232. TestCopyFiles and TestDistCh. (szetszwo)
  233. MAPREDUCE-2463. Job history files are not moved to done folder when job
  234. history location is hdfs. (Devaraj K via szetszwo)
  235. MAPREDUCE-2243. Close streams properly in a finally-block to avoid leakage
  236. in CompletedJobStatusStore, TaskLog, EventWriter and TotalOrderPartitioner.
  237. (Devaraj K via szetszwo)
  238. Release 0.22.0 - Unreleased
  239. INCOMPATIBLE CHANGES
  240. MAPREDUCE-1866. Removes deprecated class
  241. org.apache.hadoop.streaming.UTF8ByteArrayUtils. (amareshwari)
  242. MAPREDUCE-1664. Changes the behaviour of the combination of job-acls
  243. when they function together with queue-acls. (Ravi Gummadi via vinodkv)
  244. NEW FEATURES
  245. MAPREDUCE-1804. Stress-test tool for HDFS introduced in HDFS-708.
  246. (Joshua Harlow via shv)
  247. MAPREDUCE-220. Collect cpu and memory statistics per task. (Scott Chen via
  248. acmurthy)
  249. MAPREDUCE-1970. Reed-Solomon code implementation for HDFS RAID.
  250. (Scott Chen via dhruba)
  251. MAPREDUCE-2169. Integrated Reed-Solomon code with RaidNode. (Ramkumar
  252. Vadali via schen)
  253. IMPROVEMENTS
  254. MAPREDUCE-2141. Add an "extra data" field to Task for use by Mesos. (matei)
  255. MAPREDUCE-2140. Regenerate fair scheduler design doc PDF. (matei)
  256. MAPREDUCE-1546. Redirect all job pages to corresponding history page
  257. if job is not in JT memory. (Scott Chen via sharad)
  258. MAPREDUCE-1092. Enable assertions for unit tests. (Eli Collins via
  259. cdouglas)
  260. MAPREDUCE-1680. Add a metric recording JobTracker heartbeats processed.
  261. (Dick King via cdouglas)
  262. MAPREDUCE-1761. FairScheduler allows separate configuration of node
  263. and rack locality wait time (Scott Chen via dhruba)
  264. MAPREDUCE-1539. authorization checks for inter-server protocol
  265. (based on HADOOP-6600) (Boris Shkolnik via shv)
  266. MAPREDUCE-1798. Names the configuration keys for the Kerberos
  267. principals better. (Boris Shkolnik via ddas)
  268. MAPREDUCE-1773. streaming doesn't support jobclient.output.filter.
  269. (Amareshwari Sriramadasu via vinodkv)
  270. MAPREDUCE-1785. Add streaming config option for not emitting the key.
  271. (Eli Collins via sharad)
  272. MAPREDUCE-572. If #link is missing from uri format of -cacheArchive
  273. then streaming does not throw error. (Amareshwari Sriramadasu via
  274. vinodkv)
  275. MAPREDUCE-1545. Add timestamps for first task type launched in job summary.
  276. (Luke Lu via cdouglas)
  277. MAPREDUCE-1543. Add an audit log for authentication events. (Amar Kamat and
  278. Luke Lu via cdouglas)
  279. MAPREDUCE-1762. Add ability to set values of task counters. (Scott Chen via
  280. cdouglas)
  281. MAPREDUCE-1533. Reduce overhead of logging and string manipulation during
  282. heartbeat processing. (Amar Kamat and Dick King via cdouglas)
  283. MAPREDUCE-1516. JobTracker issues delegation tokens only if the user's
  284. authentication is Kerberos. (Jitendra Pandey via ddas)
  285. MAPREDUCE-647. Update distcp forrest documentation to reflect the changes
  286. of HADOOP-5472, MAPREDUCE-642 and HADOOP-5620. (Rodrigo Schmidt via
  287. szetszwo)
  288. MAPREDUCE-1851. Documents configuration parameters in streaming.
  289. (amareshwari)
  290. MAPREDUCE-1868. Add a read and connection timeout to JobClient while
  291. pulling tasklogs. (Krishna Ramachandran via acmurthy)
  292. MAPREDUCE-1778. Ensure failure to setup CompletedJobStatusStore is not
  293. silently ignored by the JobTracker. (Krishna Ramachandran via acmurthy)
  294. MAPREDUCE-1850. Includes job submit host information (name and ip) in
  295. jobconf and jobdetails display (Krishna Ramachandran via amareshwari)
  296. MAPREDUCE-1893. Slive with multiple reducers. (shv)
  297. MAPREDUCE-1248. Fixes redundant memory copying in StreamKeyValUtil.
  298. (Ruibang He via amareshwari)
  299. MAPREDUCE-1840. Enhancements to Gridmix benchmark simulating user
  300. diversity, queue replay, and task duration for JobTracker load testing.
  301. Also includes compatibility with security enhancements, and scalability
  302. improvements. (Amar Kamat, Rahul Singh, Hong Tang, and cdouglas)
  303. MAPREDUCE-1848. Put number of speculative, data local, rack local
  304. tasks in JobTracker metrics. (Scott Chen via dhruba)
  305. MAPREDUCE-1935. Makes Distcp work in a secure environment.
  306. (Boris Shkolnik via ddas)
  307. MAPREDUCE-1945. The MapReduce component for HADOOP-6632.
  308. (Kan Zhang & Jitendra Pandey via ddas)
  309. MAPREDUCE-1936. Modify Gridmix3 to support more tunable parameters for
  310. stress submission and sleep jobs. (Hong Tang via cdouglas)
  311. MAPREDUCE-1733. Makes pipes applications secure. (Jitendra Pandey via ddas)
  312. MAPREDUCE-1566. Adds a configuration attribute using which job clients can
  313. specify a credentials file. The tokens from there will be passed to the job.
  314. (Jitendra Pandey and Owen O'Malley via ddas)
  315. MAPREDUCE-1624. Documents the job credentials and associated details to do
  316. with delegation tokens (on the client side).
  317. (Jitendra Pandey and Devaraj Das via ddas)
  318. MAPREDUCE-1834. TestSimulatorDeterministicReplay times out on trunk.
  319. (Hong Tang via mahadev)
  320. MAPREDUCE-1993. Fixes test failure
  321. TestTrackerDistributedCacheManagerWithLinuxTaskController. (Devaraj Das
  322. via amareshwari)
  323. MAPREDUCE-1523. Making Mumak work with Capacity-Scheduler (Anirban Das
  324. via mahadev)
  325. MAPREDUCE-1920. Enables completed jobstatus store by default. (Tom White
  326. via amareshwari)
  327. MAPREDUCE-1881. Improve TaskTrackerInstrumentation to enable collection of
  328. advanced metrics. (Matei Zaharia via acmurthy)
  329. MAPREDUCE-1548. Hadoop archives preserve times and other properties from
  330. original files. (Rodrigo Schmidt via dhruba)
  331. MAPREDUCE-1517. Supports streaming job to run in the background. (Bochun Bai
  332. via amareshwari)
  333. MAPREDUCE-1819. RaidNode is now smarter in submitting Raid jobs. (Ramkumar
  334. Vadali via schen)
  335. MAPREDUCE-2132. A command line option in RaidShell to fix blocks using raid.
  336. MAPREDUCE-2147. Remove redundant lines in JobInProgress ctor.
  337. (Harsh J Chouraria via cutting)
  338. HADOOP-7007. Update the hudson-test-patch ant target to work with the
  339. latest test-patch.sh script (gkesavan)
  340. MAPREDUCE-1818. RaidNode can specify scheduling parameters. (Ramkumar
  341. Vadali via schen)
  342. MAPREDUCE-2051. Contribute a fair scheduler preemption system test.
  343. (Todd Lipcon via tomwhite)
  344. MAPREDUCE-1892. RaidNode can allow layered policies more efficiently.
  345. (Ramkumar Vadali via schen)
  346. MAPREDUCE-1592. Generate Eclipse's .classpath file from Ivy config.
  347. (tomwhite via nigel)
  348. MAPREDUCE-2073. TestTrackerDistributedCacheManager should be up-front
  349. about requirements on build environment. (Todd Lipcon via tomwhite)
  350. MAPREDUCE-2093. Herriot JT and TT clients should vend statistics. (cos)
  351. MAPREDUCE-2167. Faster directory traversal for raid node. (Ramkumar Vadali
  352. via schen)
  353. MAPREDUCE-1931. Gridmix forrest documentation. (Ranjit Mathew via vinodkv)
  354. MAPREDUCE-2184. Port DistRaid.java to new mapreduce API. (Ramkumar Vadali
  355. via schen)
  356. MAPREDUCE-1878. Add MRUnit documentation. (Aaron Kimball via tomwhite)
  357. MAPREDUCE-2180. Add coverage of fair scheduler servlet to system test (todd)
  358. MAPREDUCE-2250. Fix logging in raid code. (Ramkumar Vadali via schen)
  359. MAPREDUCE-2260. Remove auto-generated native build files. (rvs via eli)
  360. MAPREDUCE-2314. configure files that are generated as part of the released
  361. tarball need to have executable bit set (rvs via cos)
  362. MAPREDUCE-1159. Limit Job name in web UI to be 80 char long. (Harsh J
  363. Chouraria via szetszwo)
  364. MAPREDUCE-2337. Remove dependence of public MapReduce API on classes in
  365. server package. (tomwhite)
  366. MAPREDUCE-2383. Improve documentation of DistributedCache methods (Harsh J
  367. Chouraria via todd)
  368. MAPREDUCE-2222. Ivy resolve force mode should be turned off by default.
  369. (Luke Lu via tomwhite)
  370. MAPREDUCE-2103. task-controller shouldn't require o-r permissions.
  371. (todd via eli)
  372. MAPREDUCE-2505. Explain how to use ACLs in the fair scheduler.
  373. (matei via eli)
  374. OPTIMIZATIONS
  375. MAPREDUCE-1354. Enhancements to JobTracker for better performance and
  376. scalability. (Arun C. Murthy & Richard King via acmurthy)
  377. MAPREDUCE-1829. JobInProgress.findSpeculativeTask should use min() to
  378. find the candidate instead of sort(). (Scott Chen via vinodkv)
  379. BUG FIXES
  380. MAPREDUCE-1845. FairScheduler.tasksToPreempt() can return negative number.
  381. (Scott Chen via matei)
  382. MAPREDUCE-1707. TaskRunner can get NPE in getting ugi from TaskTracker.
  383. (Vinod Kumar Vavilapalli)
  384. MAPREDUCE-1532. Ensures that delegation tokens are obtained as the
  385. actual user when the proxy-user is used for submitting jobs. Also
  386. refactors the DelegationTokenToRenew class. (ddas)
  387. MAPREDUCE-1558. Fixes MRAdmin to look up the principal of the
  388. JobTracker and use that in the RefreshUserToGroupsMapping protocol and
  389. RefreshAuthorizationPolicyProtocol. (Boris Shkolnik via ddas)
  390. MAPREDUCE-1662. Remove unused methods from TaskRunner. (Amareshwari
  391. Sriramadasu via cdouglas)
  392. MAPREDUCE-1617. Use IPv4 stack for unit tests. (Amar Kamat and Luke Lu via
  393. cdouglas)
  394. MAPREDUCE-1599. Fixes MRBench so that it reuses tokens across jobs
  395. correctly. (Jitendra Nath Pandey via ddas)
  396. MAPREDUCE-1836. Refresh for proxy superuser config (mr part for HDFS-1096).
  397. (Boris Shkolnik via shv)
  398. MAPREDUCE-1505. Create RPC client on job submission, not in cstr of Job
  399. instance. (Dick King via cdouglas)
  400. MAPREDUCE-1813. NPE in PipeMapred.MRErrorThread. (Ravi Gummadi via vinodkv)
  401. MAPREDUCE-1225. Fixes DistributedCache to check if the file is fresh or not,
  402. for the first localization also. (Zhong Wang via amareshwari)
  403. MAPREDUCE-1559. Fixes the token renewer to use the JobTracker's
  404. credentials for talking to the NameNode. (ddas)
  405. MAPREDUCE-1492. Delete obsolete har files used on the parity files
  406. of hdfs raid. (Rodrigo Schmidt via dhruba)
  407. MAPREDUCE-1857. Removes unused configuration parameters in streaming.
  408. (amareshwari)
  409. MAPREDUCE-1887. MRAsyncDiskService now properly absolutizes volume root
  410. paths. (Aaron Kimball via zshao)
  411. MAPREDUCE-1863. Fix NPE in Rumen when processing null CDF for failed task
  412. attempts. (Amar Kamat via cdouglas)
  413. MAPREDUCE-1864. Removes uninitialized/unused variables in
  414. org.apache.hadoop.streaming.PipeMapRed. (amareshwari)
  415. MAPREDUCE-1888. Fixes Streaming to override output key and value types,
  416. only if mapper/reducer is a command. (Ravi Gummadi via amareshwari)
  417. MAPREDUCE-577. Fixes duplicate records in StreamXmlRecordReader.
  418. (Ravi Gummadi via amareshwari)
  419. MAPREDUCE-1894. Fixed a bug in DistributedRaidFileSystem.readFully()
  420. that was causing it to loop infinitely. (Ramkumar Vadali via dhruba)
  421. MAPREDUCE-1838. Reduce the time needed for raiding a bunch of files
  422. by randomly assigning files to map tasks. (Ramkumar Vadali via dhruba)
  423. MAPREDUCE-1820. Fix InputSampler to clone sampled keys. (Alex Kozlov via
  424. cdouglas)
  425. MAPREDUCE-1528. Incorporates the changes to the credentials API done in
  426. HADOOP-6845. Also, introduces Credentials in JobConf, and in JobContext.
  427. (Jitendra Pandey and Arun Murthy via ddas)
  428. MAPREDUCE-1865. Rumen should also support jobhistory files generated using
  429. trunk. (Amar Kamat via amareshwari)
  430. MAPREDUCE-1621. Fixes NPE in TextOutputReader.getLastOutput if it has never
  431. read any output. (amareshwari)
  432. MAPREDUCE-1911. Fixes errors in -info message in streaming. (amareshwari)
  433. MAPREDUCE-1772. Corrects errors in streaming documentation in forrest.
  434. (amareshwari)
  435. MAPREDUCE-1925. Fix failing TestRumenJobTraces. (Ravi Gummadi via cdouglas)
  436. MAPREDUCE-1718. Fixes a bug in the construction of jobconf key for the
  437. mapping that the tasks use at runtime for looking up delegation tokens.
  438. (Boris Shkolnik via ddas)
  439. MAPREDUCE-1701. Fixes a problem to do with exception handling in
  440. delegation-token renewals. (Boris Shkolnik via ddas)
  441. MAPREDUCE-1686. Fixes StreamUtil.goodClassOrNull to find classes without
  442. package names. (Paul Burkhardt via amareshwari)
  443. MAPREDUCE-1288. Fixes TrackerDistributedCacheManager to take into account
  444. the owner of the localized file in the mapping from cache URIs to
  445. CacheStatus objects. (ddas)
  446. MAPREDUCE-1982. Fixes Rumen's TraceBuilder to extract job name from either
  447. of configuration properties "mapreduce.job.name" and "mapred.job.name".
  448. (Ravi Gummadi via amareshwari)
  449. MAPREDUCE-1958. The MapReduce part corresponding to the HADOOP-6873.
  450. (Boris Shkolnik & Owen O'Malley via ddas)
  451. MAPREDUCE-1900. TaskTracker and JobTracker close FileSystems, opened on
  452. behalf of users, that they no longer require. (Kan Zhang and ddas via ddas)
  453. MAPREDUCE-1992. Fixes a problem to do with bringing up the JobTracker in
  454. unsecure mode. (Kan Zhang via ddas)
  455. MAPREDUCE-1999. Fixes ClientProtocol to use the correct
  456. DelegationTokenSelector. (Jitendra Pandey via ddas)
  457. MAPREDUCE-1780. AccessControlList.toString() is used for serialization of
  458. ACL in JobStatus.java. (Ravi Gummadi via vinodkv)
  459. MAPREDUCE-1961. Fix ConcurrentModificationException in Gridmix during
  460. shutdown. (Hong Tang via cdouglas)
  461. MAPREDUCE-2000. Fix parsing of JobHistory lines in Rumen when quotes are
  462. escaped. (Hong Tang via cdouglas)
  463. MAPREDUCE-2022. Fixes compilation errors in TestSubmitJob. (amareshwari)
  464. MAPREDUCE-1670. RAID policies should not scan their own destination path.
  465. (Ramkumar Vadali via dhruba)
  466. MAPREDUCE-1668. RaidNode Hars a directory only if all its parity files
  467. have been created. (Ramkumar Vadali via dhruba)
  468. MAPREDUCE-2021. Fixes duplicate hostnames in CombineFileInputFormat's
  469. split locations. (amareshwari)
  470. MAPREDUCE-1375. Fixes flaky test TestFileArgs. (Todd Lipcon via
  471. amareshwari)
  472. MAPREDUCE-2023. TestDFSIO should not stop reading if curSize != bufferSize.
  473. (Hong Tang via szetszwo)
  474. MAPREDUCE-2031. Fixes test failures TestTaskLauncher and
  475. TestTaskTrackerLocalization. (Ravi Gummadi via amareshwari)
  476. MAPREDUCE-2046. Fixes CombineFileInputFormat to allow splits with size
  477. less than DFS block size. (dhruba borthakur via amareshwari)
  478. MAPREDUCE-1975. Fixes unnecessary InterruptedException log in gridmix.
  479. (Ravi Gummadi via amareshwari)
  480. MAPREDUCE-1597. Fixes CombineFileInputFormat to work with non-splittable
  481. files. (amareshwari)
  482. MAPREDUCE-2032. Fixes TestJobCleanup to cleanup test directory in
  483. tearDown. (Dick King via amareshwari)
  484. MAPREDUCE-1979. Fixes "Output directory already exists" error in gridmix
  485. when gridmix.output.directory is not defined. (Ravi Gummadi via
  486. amareshwari)
  487. MAPREDUCE-1918. Adds documentation to Rumen. (Amar Kamat via amareshwari)
  488. MAPREDUCE-2078. Fixes TraceBuilder to generate traces when a globbed job
  489. history path is given. (Amar Kamat via amareshwari)
  490. MAPREDUCE-1989. Fixes error message in gridmix when user resolver is set
  491. and no user list is given. (Ravi Gummadi via amareshwari)
  492. MAPREDUCE-2067. Distinct minicluster services (e.g. NN and JT) overwrite
  493. each other's service policies. (Aaron T. Myers via tomwhite)
  494. MAPREDUCE-2029. DistributedRaidFileSystem removes itself from FileSystem
  495. cache when it is closed. (Ramkumar Vadali via dhruba)
  496. MAPREDUCE-1816. HAR files used for RAID parity-bite have configurable
  497. partfile size. (Ramkumar Vadali via dhruba)
  498. MAPREDUCE-2082. Fixes Pipes to create the jobtoken file in the right
  499. place. (Jitendra Pandey via ddas)
  500. MAPREDUCE-2095. Fixes Gridmix to run from compressed traces. (Ranjit
  501. Mathew via amareshwari)
  502. MAPREDUCE-1908. DistributedRaidFileSystem now handles ChecksumException
  503. correctly. (Ramkumar Vadali via schen)
  504. MAPREDUCE-2126. JobQueueJobInProgressListener's javadoc is inconsistent
  505. with source code. (Jingguo Yao via tomwhite)
  506. MAPREDUCE-2143. HarFileSystem is able to handle spaces in pathnames.
  507. (Ramkumar Vadali via dhruba)
  508. MAPREDUCE-1867. Remove unused methods in
  509. org.apache.hadoop.streaming.StreamUtil. (amareshwari via tomwhite)
  510. MAPREDUCE-2146. Raid does not affect access time of a source file.
  511. (Ramkumar Vadali via dhruba)
  512. MAPREDUCE-2150. RaidNode periodically fixes corrupt blocks. (Ramkumar Vadali via
  513. schen)
  514. MAPREDUCE-2099. RaidNode recreates outdated parity HARs. (Ramkumar Vadali
  515. via schen)
  516. MAPREDUCE-2173. Fix race condition in TestBlockFixer that was
  517. causing intermittent failure (Patrick Kling via dhruba)
  518. MAPREDUCE-2142. Refactor RaidNode so that the map-reduce component is
  519. clearly separated out. (Patrick Kling via dhruba)
  520. MAPREDUCE-2179. Fix RaidBlockSender compilation failure. (Ramkumar Vadali
  521. via schen)
  522. MAPREDUCE-2034. TestSubmitJob triggers NPE instead of permissions error.
  523. (Todd Lipcon via tomwhite)
  524. MAPREDUCE-2195. New property for local conf directory in
  525. system-test-mapreduce.xml file. (cos)
  526. MAPREDUCE-1783. FairScheduler initializes tasks only when the job can be
  527. run. (Ramkumar Vadali via schen)
  528. MAPREDUCE-2224. Fix synchronization bugs in JvmManager. (todd)
  529. MAPREDUCE-714. JobConf.findContainingJar unescapes unnecessarily on linux (todd)
  530. MAPREDUCE-2096. Secure local filesystem IO from symlink vulnerabilities (todd)
  531. MAPREDUCE-2234. If Localizer can't create task log directory, it should fail
  532. on the spot. (todd)
  533. MAPREDUCE-2219. JobTracker should not try to remove mapred.system.dir
  534. during startup. (todd)
  535. MAPREDUCE-2207. Task-cleanup task should not be scheduled on the node that
  536. the task just failed. (Liyin Liang via schen)
  537. MAPREDUCE-2084. Remove deprecate annotation for package file. The package
  538. classes themselves are already deprecated. This removes an Eclipse error.
  539. (tomwhite via nigel)
  540. MAPREDUCE-2248. DistributedRaidFileSystem should unraid only the corrupt
  541. block (Ramkumar Vadali via schen)
  542. MAPREDUCE-1085. For tasks, "ulimit -v -1" is being run when user doesn't
  543. specify a ulimit (todd)
  544. MAPREDUCE-2282. Fix TestMRServerPorts for the changes in
  545. TestHDFSServerPorts. (shv via szetszwo)
  546. MAPREDUCE-2238. Fix permissions handling to avoid leaving undeletable
  547. directories in local dirs. (todd)
  548. MAPREDUCE-2277. TestCapacitySchedulerWithJobTracker needs to wait for jobs
  549. to complete before testing status. (todd)
  550. MAPREDUCE-2253. Servlets should specify content type (todd)
  551. MAPREDUCE-2283. Add timeout for Raid Tests (Ramkumar Vadali via schen)
  552. MAPREDUCE-1754. Replace mapred.permissions.supergroup with an
  553. acl : mapreduce.cluster.administrators (Amareshwari Sriramadasu via shv)
  554. MAPREDUCE-2256. FairScheduler fairshare preemption from multiple pools may
  555. preempt all tasks from one pool causing that pool to go below fairshare.
  556. (Priyo Mustafi via shv)
  557. MAPREDUCE-2281. MR part of HADOOP-6642. (Chris Douglas, Po Cheung via shv)
  558. MAPREDUCE-2200. TestUmbilicalProtocolWithJobToken is failing without Krb
  559. environment: needs to be conditional. (cos)
  560. MAPREDUCE-2077. Resolve name clash in the deprecated
  561. o.a.h.util.MemoryCalculatorPlugin (Luke Lu via shv)
  562. MAPREDUCE-2188. The new API MultithreadedMapper doesn't initialize
  563. RecordReader. (Owen O'Malley via shv)
  564. MAPREDUCE-1915. Fix IndexOutOfBoundsException in IndexCache.
  565. (Priyo Mustafi via shv)
  566. MAPREDUCE-1974. Fix multiple preemptions of the same task in FairScheduler.
  567. (Scott Chen via shv)
  568. MAPREDUCE-2304. Fix TestMRCLI to allow hostname with a hyphen (-).
  569. (Priyo Mustafi via shv)
  570. MAPREDUCE-1825. jobqueue_details.jsp and FairSchedulerServlet should not
  571. call finishedMaps and finishedReduces when job is not initialized.
  572. (Scott Chen via shv)
  573. MAPREDUCE-2285. MiniMRCluster does not start after ant test-patch
  574. (todd)
  575. MAPREDUCE-2315. javadoc is failing in nightly build (todd)
  576. MAPREDUCE-2054. Hierarchical queue implementation broke dynamic queue
  577. addition in Dynamic Scheduler. (Thomas Sandholm via tomwhite)
  578. MAPREDUCE-2272. Job ACL file should not be executable
  579. (Harsh J Chouraria via todd)
  580. MAPREDUCE-2241. ClusterWithLinuxTaskController should accept relative path
  581. on the command line. (todd)
  582. MAPREDUCE-2251. Remove unused mapreduce.job.userhistorylocation config.
  583. (Harsh J Chouraria via todd)
  584. MAPREDUCE-2284. TestLocalRunner.testMultiMaps times out (todd)
  585. MAPREDUCE-2336. Tool-related packages should be in the Tool javadoc group.
  586. (tomwhite)
  587. MAPREDUCE-2394. JUnit output format doesn't propagate into raid contrib
  588. build. (todd)
  589. MAPREDUCE-2392. TaskTracker shutdown in the tests sometimes take 60s.
  590. (tomwhite)
  591. MAPREDUCE-2437. SLive uses only part* files to generate the final report.
  592. (shv)
  593. MAPREDUCE-2428. start-mapred.sh script fails if HADOOP_HOME is not set.
  594. (tomwhite via eli)
  595. MAPREDUCE-2445. Fix TestMiniMRWithDFSWithDistinctUsers to be a valid test.
  596. (todd)
  597. MAPREDUCE-2457. Job submission should inject group.name on the JobTracker
  598. (Alejandro Abdelnur via todd)
  599. MAPREDUCE-2472. Extra whitespace in mapred.child.java.opts breaks JVM
  600. initialization. (Aaron T. Myers via todd)
  601. MAPREDUCE-2222. Ivy resolve force mode should be turned off by default.
  602. (Luke Lu via tomwhite)
  603. MAPREDUCE-2486. Incorrect snapshot dependency published in .pom files
  604. (todd)
  605. MAPREDUCE-2327. MapTask doesn't need to put username information in
  606. SpillRecord. (todd via tomwhite)
  607. MAPREDUCE-2515. MapReduce code references some deprecated options
  608. (Ari Rabkin via todd)
  609. MAPREDUCE-2487. ChainReducer uses MAPPER_BY_VALUE instead of
  610. REDUCER_BY_VALUE. (Devaraj K via todd)
  611. MAPREDUCE-2185. Fix infinite loop at creating splits using
  612. CombineFileInputFormat. (Ramkumar Vadali via schen)
  613. MAPREDUCE-2571. CombineFileInputFormat.getSplits throws a
  614. java.lang.ArrayStoreException. (Bochun Bai via todd)
  615. Release 0.21.1 - Unreleased
  616. NEW FEATURES
  617. MAPREDUCE-2040. Forrest Documentation for Dynamic Priority Scheduler.
  618. (Thomas Sandholm via tomwhite)
  619. BUG FIXES
  620. MAPREDUCE-1897. trunk build broken on compile-mapred-test (cos)
  621. MAPREDUCE-1280. Update Eclipse plugin to the new eclipse.jdt API.
  622. (Alex Kozlov via szetszwo)
  623. MAPREDUCE-1984. herriot TestCluster fails because exclusion is not there
  624. (Balaji Rajagopalan via cos)
  625. MAPREDUCE-2090. Clover build doesn't generate per-test coverage. (cos)
  626. MAPREDUCE-2134. ant binary-system is broken in mapreduce project. (cos)
  627. MAPREDUCE-1905. Fixes Context.setStatus() and progress() apis.
  628. (amareshwari)
  629. MAPREDUCE-1809. Ant build changes for Streaming system tests in contrib
  630. projects. (Vinay Kumar Thota via amareshwari)
  631. MAPREDUCE-2223. TestMRCLI might fail on Ubuntu with default /etc/hosts
  632. (cos)
  633. MAPREDUCE-2228. Remove java5 dependencies from build. (cos)
  634. MAPREDUCE-1929. Allow artifacts to be published to the staging Apache Nexus
  635. Maven Repository. (tomwhite)
  636. MAPREDUCE-2317. Fix a NPE in HadoopArchives. (Devaraj K via szetszwo)
  637. MAPREDUCE-2127. mapreduce trunk builds are failing on hudson.
  638. (Bruno Mahé via eli)
  639. Release 0.21.0 - 2010-08-13
  640. INCOMPATIBLE CHANGES
  641. MAPREDUCE-516. Fix the starvation problem in the Capacity Scheduler
  642. when running High RAM Jobs. (Arun Murthy via yhemanth)
  643. MAPREDUCE-358. Change org.apache.hadoop.examples.AggregateWordCount
  644. and org.apache.hadoop.examples.AggregateWordHistogram to use new
  645. mapreduce api. (Amareshwari Sriramadasu via sharad)
  646. MAPREDUCE-245. Change Job and jobcontrol classes to use the List interface
  647. rather than ArrayList in APIs. (Tom White via cdouglas)
  648. MAPREDUCE-766. Enhanced list-blacklisted-trackers to display reasons
  649. for blacklisting a node. (Sreekanth Ramakrishnan via yhemanth)
  650. MAPREDUCE-817. Add a cache for retired jobs with minimal job info and
  651. provide a way to access history file url. (sharad)
  652. MAPREDUCE-711. Moved Distributed Cache from Common to Map/Reduce
  653. project. (Vinod Kumar Vavilapalli via yhemanth)
  654. MAPREDUCE-895. Per the contract elucidated in HADOOP-6201, throw
  655. FileNotFoundException from FileSystem::listStatus rather than returning
  656. null. (Jakob Homan via cdouglas)
  657. MAPREDUCE-479. Provide full task id to map output servlet rather than the
  658. reduce id, only. (Jiaqi Tan via cdouglas)
  659. MAPREDUCE-873. Simplify job recovery. Incomplete jobs are resubmitted on
  660. jobtracker restart. Removes a public constructor in JobInProgress. (sharad)
  661. HADOOP-6230. Moved process tree and memory calculator related classes from
  662. Common to Map/Reduce. (Vinod Kumar Vavilapalli via yhemanth)
  663. MAPREDUCE-157. Refactor job history APIs and change the history format to
  664. JSON. (Jothi Padmanabhan via sharad)
  665. MAPREDUCE-849. Rename configuration properties. (Amareshwari Sriramadasu
  666. via sharad)
  667. MAPREDUCE-1287. Only call the partitioner with more than one reducer.
  668. (cdouglas)
  669. MAPREDUCE-1385. Use the new UserGroupInformation from HADOOP-6299.
  670. (ddas via omalley)
  671. MAPREDUCE-1493. Authorization for job-history pages. (vinodkv)
  672. MAPREDUCE-1607. Task controller may not set permissions for a
  673. task cleanup attempt's log directory (Amareshwari Sriramadasu via vinodkv)
  674. MAPREDUCE-1683. Remove JNI calls from ClusterStatus cstr. (Arun Murthy and
  675. Luke Lu via cdouglas)
  676. MAPREDUCE-1855. Makes the refresh methods (for groups and proxy users)
  677. independent of the client side configuration. (Boris Shkolnik via ddas)
  678. NEW FEATURES
  679. MAPREDUCE-1774. Large-scale Automated Framework (Sharad Agarwal, Sreekanth
  680. Ramakrishnan, Konstantin Boudnik, et al. via cos)
  681. MAPREDUCE-706. Support for FIFO pools in the fair scheduler.
  682. (Matei Zaharia)
  683. MAPREDUCE-546. Provide sample fair scheduler config file in conf/ and use
  684. it by default if no other config file is specified. (Matei Zaharia)
  685. MAPREDUCE-551. Preemption support in the Fair Scheduler. (Matei Zaharia)
  686. MAPREDUCE-567. Add a new example MR that always fails. (Philip Zeyliger
  687. via tomwhite)
  688. MAPREDUCE-211. Provides ability to run a health check script on the
  689. tasktracker nodes and blacklist nodes if they are unhealthy.
  690. (Sreekanth Ramakrishnan via yhemanth)
  691. MAPREDUCE-637. Add an example, distbbp, which is able to compute the nth bit
  692. of Pi for some large n. (szetszwo)
  693. MAPREDUCE-532. Provide a way to limit the number of used slots
  694. per queue in the capacity scheduler.
  695. (Rahul Kumar Singh via yhemanth)
  696. MAPREDUCE-467. Provide ability to collect statistics about total tasks
  697. and succeeded tasks in different time windows. (sharad)
  698. MAPREDUCE-740. Log a job-summary at the end of a job, while allowing it
  699. to be configured to use a custom appender if desired. (acmurthy)
  700. MAPREDUCE-814. Provide a way to configure completed job history files
  701. to be on HDFS. (sharad)
  702. MAPREDUCE-800. MRUnit should support the new API. (Aaron Kimball via
  703. tomwhite)
  704. MAPREDUCE-798. MRUnit should be able to test a succession of MapReduce
  705. passes. (Aaron Kimball via tomwhite)
  706. MAPREDUCE-768. Provide an option to dump jobtracker configuration in JSON
  707. format to standard output. (V.V.Chaitanya Krishna via yhemanth)
  708. MAPREDUCE-824. Add support for a hierarchy of queues in the capacity
  709. scheduler. (Rahul Kumar Singh via yhemanth)
  710. MAPREDUCE-751. Add Rumen, a tool for extracting statistics from job tracker
  711. logs and generating job traces for simulation and analysis. (Dick King via
  712. cdouglas)
  713. MAPREDUCE-830. Add support for splittable compression to TextInputFormats.
  714. (Abdul Qadeer via cdouglas)
  715. MAPREDUCE-861. Add support for hierarchical queues in the Map/Reduce
  716. framework. (Rahul Kumar Singh via yhemanth)
  717. MAPREDUCE-776. Add Gridmix, a benchmark processing Rumen traces to simulate
  718. a measured mix of jobs on a cluster. (cdouglas)
  719. MAPREDUCE-862. Enhance JobTracker UI to display hierarchical queues.
  720. (V.V.Chaitanya Krishna via yhemanth)
  721. MAPREDUCE-777. Brand new apis to track and query jobs as a
  722. replacement for JobClient. (Amareshwari Sriramadasu via acmurthy)
  723. MAPREDUCE-775. Add native and streaming support for Vertica as an input
  724. or output format taking advantage of parallel read and write properties of
  725. the DBMS. (Omer Trajman via ddas)
  726. MAPREDUCE-679. XML-based metrics as JSP servlet for JobTracker.
  727. (Aaron Kimball via tomwhite)
  728. MAPREDUCE-980. Modify JobHistory to use Avro for serialization. (cutting)
  729. MAPREDUCE-728. Add Mumak, a Hadoop map/reduce simulator. (Arun C Murthy,
  730. Tamas Sarlos, Anirban Dasgupta, Guanying Wang, and Hong Tang via cdouglas)
  731. MAPREDUCE-1383. Automates fetching of delegation tokens in File*Formats,
  732. Distributed Cache and Distcp. Also, provides a config
  733. mapreduce.job.hdfs-servers that the jobs can populate with a comma
  734. separated list of namenodes. The job client automatically fetches
  735. delegation tokens from those namenodes. (Boris Shkolnik via ddas)
  736. MAPREDUCE-698. Per-pool task limits for the fair scheduler.
  737. (Kevin Peterson via matei)
  738. MAPREDUCE-1026. Does mutual authentication of the shuffle
  739. transfers using a shared JobTracker generated key.
  740. (Boris Shkolnik via ddas)
  741. MAPREDUCE-744. Introduces the notion of a public distributed cache.
  742. (Devaraj Das)
  743. MAPREDUCE-1338. Introduces the notion of token cache using which
  744. tokens and secrets can be sent by the Job client to the JobTracker.
  745. (Boris Shkolnik via ddas)
  746. HDFS-503. This patch implements an optional layer over HDFS that
  747. implements offline erasure-coding. It can be used to reduce the
  748. total storage requirements of HDFS. (dhruba)
  749. MAPREDUCE-1432. Adds hooks in the jobtracker and tasktracker
  750. for loading the tokens in the user's ugi. This is required
  751. for the copying of files from the hdfs. (ddas)
  752. MAPREDUCE-1335. Adds SASL Kerberos/Digest authentication in MapReduce.
  753. (Kan Zhang via ddas)
  754. MAPREDUCE-1464. Makes a compatible change in JobTokenIdentifier to
  755. account for HADOOP-6510. (Jitendra Nath Pandey via ddas)
  756. MAPREDUCE-1433. Add a delegation token for MapReduce. (omalley)
  757. MAPREDUCE-1307. Introduces the Job level ACLs feature.
  758. (Vinod Kumar Vavilapalli via ddas)
  759. MAPREDUCE-1430. JobTracker automatically renews delegation tokens for jobs.
  760. (Boris Shkolnik via ddas)
  761. MAPREDUCE-1455. Introduces job-level authorization for mapreduce servlets.
  762. (Ravi Gummadi via vinodkv)
  763. IMPROVEMENTS
  764. MAPREDUCE-463. Makes job setup and cleanup tasks optional.
  765. (Amareshwari Sriramadasu via sharad)
  766. MAPREDUCE-502. Allow jobtracker to be configured with zero completed jobs
  767. in memory. (Amar Kamat via sharad)
  768. MAPREDUCE-416. Moves the history file to a "done" folder whenever a job
  769. completes. (Amar Kamat via ddas)
  770. MAPREDUCE-646. Increase srcfilelist replication number in distcp job.
  771. (Ravi Gummadi via szetszwo)
  772. HADOOP-6106. Updated hadoop-core and test jars from hudson trunk
  773. build #12. (Giridharan Kesavan)
  774. MAPREDUCE-642. An option to distcp that allows preserving the full
  775. source path of a file in the specified destination directory.
  776. (Rodrigo Schmidt via dhruba)
  777. MAPREDUCE-686. Move TestSpeculativeExecution.Fake* into a separate class
  778. so that it can be used by other tests. (Jothi Padmanabhan via sharad)
  779. MAPREDUCE-625. Modify TestTaskLimits to improve execution time.
  780. (Jothi Padmanabhan via sharad)
  781. MAPREDUCE-465. Deprecate o.a.h.mapred.lib.MultithreadedMapRunner and add
  782. test for o.a.h.mapreduce.lib.MultithreadedMapper.
  783. (Amareshwari Sriramadasu via sharad)
  784. MAPREDUCE-701. Improves the runtime of the TestRackAwareTaskPlacement
  785. by making it a unit test. (Jothi Padmanabhan via ddas)
  786. MAPREDUCE-371. Change KeyFieldBasedComparator and KeyFieldBasedPartitioner
  787. to use new api. (Amareshwari Sriramadasu via sharad)
  788. MAPREDUCE-623. Resolve javac warnings in mapreduce. (Jothi Padmanabhan
  789. via sharad)
  790. MAPREDUCE-655. Change KeyValueLineRecordReader and KeyValueTextInputFormat
  791. to use new mapreduce api. (Amareshwari Sriramadasu via sharad)
  792. MAPREDUCE-632. Merge TestCustomOutputCommitter with
  793. TestCommandLineJobSubmission. (Jothi Padmanabhan via sharad)
  794. MAPREDUCE-627. Improves execution time of TestTrackerBlacklistAcrossJobs.
  795. (Jothi Padmanabhan via ddas)
  796. MAPREDUCE-630. Improves execution time of TestKillCompletedJob.
  797. (Jothi Padmanabhan via ddas)
  798. MAPREDUCE-626. Improves the execution time of TestLostTracker.
  799. (Jothi Padmanabhan via ddas)
  800. MAPREDUCE-353. Makes the shuffle read and connection timeouts
  801. configurable. (Ravi Gummadi via ddas)
  802. MAPREDUCE-739. Allow relative paths to be created in archives. (Mahadev
  803. Konar via cdouglas)
  804. MAPREDUCE-772. Merge HADOOP-4010 changes to LineRecordReader into mapreduce
  805. package. (Abdul Qadeer via cdouglas)
  806. MAPREDUCE-785. Separate sub-test of TestReduceFetch to be included in
  807. MR-670. (Jothi Padmanabhan via cdouglas)
  808. MAPREDUCE-784. Modify TestUserDefinedCounters to use LocalJobRunner
  809. instead of MiniMR. (Jothi Padmanabhan via sharad)
  810. HADOOP-6160. Fix releaseaudit target to run on specific directories.
  811. (gkesavan)
  812. MAPREDUCE-782. Use PureJavaCrc32 in SpillRecord. (Todd Lipcon via
  813. szetszwo)
  814. MAPREDUCE-369. Change org.apache.hadoop.mapred.lib.MultipleInputs to
  815. use new api. (Amareshwari Sriramadasu via sharad)
  816. MAPREDUCE-373. Change org.apache.hadoop.mapred.lib.FieldSelectionMapReduce
  817. to use new api. (Amareshwari Sriramadasu via sharad)
  818. MAPREDUCE-628. Improves the execution time of TestJobInProgress.
  819. (Jothi Padmanabhan via ddas)
  820. MAPREDUCE-793. Creates a new test that consolidates a few tests to
  821. include in the commit-test list. (Jothi Padmanabhan via ddas)
  822. MAPREDUCE-797. Adds combiner support to MRUnit MapReduceDriver.
  823. (Aaron Kimball via johan)
  824. MAPREDUCE-656. Change org.apache.hadoop.mapred.SequenceFile* classes
  825. to use new mapreduce api. (Amareshwari Sriramadasu via sharad)
  826. MAPREDUCE-670. Creates ant target for 10 mins patch test build.
  827. (Jothi Padmanabhan via gkesavan)
  828. MAPREDUCE-375. Change org.apache.hadoop.mapred.lib.NLineInputFormat
  829. and org.apache.hadoop.mapred.MapFileOutputFormat to use new api.
  830. (Amareshwari Sriramadasu via ddas)
  831. MAPREDUCE-779. Added node health failure counts into
  832. JobTrackerStatistics. (Sreekanth Ramakrishnan via yhemanth)
  833. MAPREDUCE-842. Setup secure permissions for localized job files,
  834. intermediate outputs and log files on tasktrackers.
  835. (Vinod Kumar Vavilapalli via yhemanth)
  836. MAPREDUCE-478. Allow map and reduce jvm parameters, environment variables
  837. and ulimit to be set separately.
  838. Configuration changes:
  839. add mapred.map.child.java.opts
  840. add mapred.reduce.child.java.opts
  841. add mapred.map.child.env
  842. add mapred.reduce.child.env
  843. add mapred.map.child.ulimit
  844. add mapred.reduce.child.ulimit
  845. deprecated mapred.child.java.opts
  846. deprecated mapred.child.env
  847. deprecated mapred.child.ulimit
  848. (acmurthy)
  849. MAPREDUCE-767. Remove the dependence on the CLI 2.0 snapshot.
  850. (Amar Kamat via omalley)
  851. MAPREDUCE-712. Minor efficiency tweaks to RandomTextWriter. (cdouglas)
  852. MAPREDUCE-870. Remove the job retire thread and the associated
  853. config parameters. (sharad)
  854. MAPREDUCE-874. Rename the PiEstimator example to QuasiMonteCarlo.
  855. (szetszwo)
  856. MAPREDUCE-336. Allow logging level of map/reduce tasks to be configurable.
  857. Configuration changes:
  858. add mapred.map.child.log.level
  859. add mapred.reduce.child.log.level
  860. (acmurthy)
  861. MAPREDUCE-355. Update mapred.join package to use the new API. (Amareshwari
  862. Sriramadasu via cdouglas)
  863. HADOOP-6184. Updated hadoop common and test jars to get the new API
  864. in Configuration for dumping in JSON format from Hudson trunk build #68.
  865. (yhemanth)
  866. MAPREDUCE-476. Extend DistributedCache to work locally (LocalJobRunner).
  867. (Philip Zeyliger via tomwhite)
  868. MAPREDUCE-825. JobClient completion poll interval of 5s causes slow tests
  869. in local mode. (Aaron Kimball via tomwhite)
  870. MAPREDUCE-910. Support counters in MRUnit. (Aaron Kimball via cdouglas)
  871. MAPREDUCE-788. Update gridmix2 to use the new API (Amareshwari Sriramadasu
  872. via cdouglas)
  873. MAPREDUCE-875. Make DBRecordReader execute queries lazily. (Aaron Kimball
  874. via enis)
  875. MAPREDUCE-318. Modularizes the shuffle code. (Jothi Padmanabhan and
  876. Arun Murthy via ddas)
  877. MAPREDUCE-936. Allow a load difference for fairshare scheduler.
  878. (Zheng Shao via dhruba)
  879. MAPREDUCE-370. Update MultipleOutputs to use the API, merge functionality
  880. of MultipleOutputFormat. (Amareshwari Sriramadasu via cdouglas)
  881. MAPREDUCE-898. Changes DistributedCache to use the new API.
  882. (Amareshwari Sriramadasu via ddas)
  883. MAPREDUCE-144. Includes dump of the process tree in task diagnostics when
  884. a task is killed due to exceeding memory limits.
  885. (Vinod Kumar Vavilapalli via yhemanth)
  886. MAPREDUCE-945. Modifies MRBench and TestMapRed to use ToolRunner so that
  887. options such as queue name can be passed via command line.
  888. (Sreekanth Ramakrishnan via yhemanth)
  889. MAPREDUCE-963. Deprecate o.a.h.mapred.FileAlreadyExistsException and
  890. replace it with o.a.h.fs.FileAlreadyExistsException. (Boris Shkolnik
  891. via szetszwo)
  892. MAPREDUCE-960. Remove an unnecessary intermediate copy and obsolete API
  893. from KeyValueLineRecordReader. (cdouglas)
  894. MAPREDUCE-930. Modify Rumen to resolve paths in the canonical way, rather
  895. than defaulting to the local filesystem. (cdouglas)
  896. MAPREDUCE-944. Extend the LoadManager API of the fair-share scheduler
  897. to support regulating tasks for a job based on resources currently in use
  898. by that job. (dhruba)
  899. MAPREDUCE-973. Move FailJob and SleepJob from examples to test. (cdouglas
  900. via omalley)
  901. MAPREDUCE-966. Modify Rumen to clean up interfaces and simplify integration
  902. with other tools. (Hong Tang via cdouglas)
  903. MAPREDUCE-856. Setup secure permissions for distributed cache files.
  904. (Vinod Kumar Vavilapalli via yhemanth)
  905. MAPREDUCE-885. More efficient SQL queries for DBInputFormat. (Aaron Kimball
  906. via enis)
  907. MAPREDUCE-284. Enables ipc.client.tcpnodelay in Tasktracker's Child.
  908. (Ravi Gummadi via sharad)
  909. MAPREDUCE-916. Split the documentation to match the project split.
  910. (Corinne Chandel via omalley)
  911. MAPREDUCE-649. Validate a copy by comparing the source and destination
  912. checksums in distcp. Also adds an intra-task retry mechanism for errors
  913. detected during the copy. (Ravi Gummadi via cdouglas)
  914. MAPREDUCE-654. Add a -dryrun option to distcp printing a summary of the
  915. file data to be copied, without actually performing the copy. (Ravi Gummadi
  916. via cdouglas)
  917. MAPREDUCE-664. Display the number of files deleted by distcp when the
  918. -delete option is specified. (Ravi Gummadi via cdouglas)
  919. MAPREDUCE-781. Let the name of distcp jobs be configurable. (Venkatesh S
  920. via cdouglas)
  921. MAPREDUCE-975. Add an API in job client to get the history file url for
  922. a given job id. (sharad)
  923. MAPREDUCE-905. Add Eclipse launch tasks for MapReduce. (Philip Zeyliger
  924. via tomwhite)
  925. MAPREDUCE-277. Makes job history counters available on the job history
  926. viewers. (Jothi Padmanabhan via ddas)
  927. MAPREDUCE-893. Provides an ability to refresh queue configuration
  928. without restarting the JobTracker.
  929. (Vinod Kumar Vavilapalli and Rahul Kumar Singh via yhemanth)
  930. MAPREDUCE-1011. Add build.properties to svn and git ignore. (omalley)
  931. MAPREDUCE-954. Change Map-Reduce context objects to be interfaces.
  932. (acmurthy)
  933. MAPREDUCE-639. Change Terasort example to reflect the 2009 updates.
  934. (omalley)
  935. MAPREDUCE-1063. Document gridmix benchmark. (cdouglas)
  936. MAPREDUCE-931. Use built-in interpolation classes for making up task
  937. runtimes in Rumen. (Dick King via cdouglas)
  938. MAPREDUCE-1012. Mark Context interfaces as public evolving. (Tom White via
  939. cdouglas)
  940. MAPREDUCE-971. Document use of distcp when copying to s3, managing timeouts
  941. in particular. (Aaron Kimball via cdouglas)
  942. HDFS-663. DFSIO for append. (shv)
  943. HDFS-641. Move all of the components that depend on map/reduce to
  944. map/reduce. (omalley)
  945. HADOOP-5107. Use Maven ant tasks to publish artifacts. (Giridharan Kesavan
  946. via omalley)
  947. MAPREDUCE-1229. Allow customization of job submission policy in Mumak.
  948. (Hong Tang via cdouglas)
  949. MAPREDUCE-1317. Reduce the memory footprint of Rumen objects by interning
  950. host Strings. (Hong Tang via cdouglas)
  951. MAPREDUCE-1097. Add support for Vertica 3.5 to its contrib module. (Omer
  952. Trajman via cdouglas)
  953. MAPREDUCE-1627. HadoopArchives should not use a method in DistCp.
  954. (szetszwo)
  955. MAPREDUCE-1198. Alternatively schedule different types of tasks in
  956. fair share scheduler. (Scott Chen via matei)
  957. MAPREDUCE-707. Provide a jobconf property for explicitly assigning a job to
  958. a pool in the Fair Scheduler. (Alan Heirich via matei)
  959. MAPREDUCE-947. Added commitJob and abortJob apis to OutputCommitter.
  960. Enhanced FileOutputCommitter to create a _SUCCESS file for successful
  961. jobs. (Amar Kamat & Jothi Padmanabhan via acmurthy)
  962. MAPREDUCE-1103. Added more metrics to Jobtracker. (sharad)
  963. MAPREDUCE-1048. Add occupied/reserved slot usage summary on jobtracker UI.
  964. (Amareshwari Sriramadasu and Hemanth Yamijala via sharad)
  965. MAPREDUCE-1090. Modified log statement in TaskMemoryManagerThread to
  966. include task attempt id. (yhemanth)
  967. MAPREDUCE-1189. Reduce ivy console output to observable level (cos)
  968. MAPREDUCE-1167. ProcfsBasedProcessTree collects rss memory information.
  969. (Scott Chen via dhruba)
  970. MAPREDUCE-1231. Added a new DistCp option, -skipcrccheck, so that the CRC
  971. check during setup can be skipped. (Jothi Padmanabhan via szetszwo)
  972. MAPREDUCE-1190. Add package documentation for BBP example.
  973. (Tsz Wo (Nicholas) Sze via cdouglas)
  974. MAPREDUCE-1119. When tasks fail to report status, show tasks' stack dump
  975. before killing. (Aaron Kimball via tomwhite)
  976. MAPREDUCE-1185. Redirect running job url to history url if job is already
  977. retired. (Amareshwari Sriramadasu and Sharad Agarwal via sharad)
  978. MAPREDUCE-1050. Introduce a mock object testing framework. (tomwhite)
  979. MAPREDUCE-1084. Implementing aspects development and fault injection
  980. framework for MapReduce. (Sreekanth Ramakrishnan via cos)
  981. MAPREDUCE-1209. Move common specific part of the test TestReflectionUtils
  982. out of mapred into common. (Todd Lipcon via tomwhite)
  983. MAPREDUCE-967. TaskTracker does not need to fully unjar job jars.
  984. (Todd Lipcon via tomwhite)
  985. MAPREDUCE-1083. Changes in MapReduce so that group information of users
  986. can be refreshed in the JobTracker via command line.
  987. (Boris Shkolnik via ddas)
  988. MAPREDUCE-181. Changes the job submission process to be secure.
  989. (Devaraj Das)
  990. MAPREDUCE-1250. Refactors the JobToken to use Common's Token interface.
  991. (Kan Zhang via ddas)
  992. MAPREDUCE-896. Enhance tasktracker to cleanup files that might have
  993. been created by user tasks with non-writable permissions.
  994. (Ravi Gummadi via yhemanth)
  995. MAPREDUCE-372. Change org.apache.hadoop.mapred.lib.ChainMapper/Reducer
  996. to use new mapreduce api. (Amareshwari Sriramadasu via sharad)
  997. MAPREDUCE-1295. Add a tool in Rumen for folding and manipulating job
  998. traces. (Dick King via cdouglas)
  999. MAPREDUCE-1302. TrackerDistributedCacheManager deletes file
  1000. asynchronously, thus reducing task initialization delays.
  1001. (Zheng Shao via dhruba)
  1002. MAPREDUCE-1218. TaskTrackers send cpu and memory usage of
  1003. node to JobTracker. (Scott Chen via dhruba)
  1004. MAPREDUCE-847. Fix Releaseaudit warning count to zero
  1005. (Giridharan Kesavan)
  1006. MAPREDUCE-1337. Use generics in StreamJob to improve readability of that
  1007. class. (Kay Kay via cdouglas)
  1008. MAPREDUCE-361. Port terasort example to the new mapreduce API. (Amareshwari
  1009. Sriramadasu via cdouglas)
  1010. MAPREDUCE-1367. LocalJobRunner should support parallel mapper execution.
  1011. (Aaron Kimball via tomwhite)
  1012. MAPREDUCE-64. Eliminate io.sort.record.percent from MapTask configuration.
  1013. (cdouglas)
  1014. MAPREDUCE-1440. Replace the long user name in MapReduce with the local
  1015. name. (omalley)
  1016. MAPREDUCE-1470. Move delegation tokens from HDFS to Common so that
  1017. MapReduce can use them too. (omalley)
  1018. MAPREDUCE-1425. Reduce memory usage by archive. (mahadev via szetszwo)
  1019. MAPREDUCE-1441. Trim whitespace from directory lists pulled from the
  1020. configuration. (Todd Lipcon via cdouglas)
  1021. MAPREDUCE-1309. Refactor Rumen trace generator to improve code structure
  1022. and add extensible support for log formats. (Dick King via cdouglas)
  1023. MAPREDUCE-1503. Delegation token renewing and cancelling should provide
  1024. meaningful exceptions when there are failures instead of returning
  1025. false. (omalley)
  1026. HADOOP-6579. Upgrade commons-codec library to 1.4. (omalley)
  1027. MAPREDUCE-1423. Improve performance of CombineFileInputFormat when multiple
  1028. pools are configured. (Dhruba Borthakur via zshao)
  1029. MAPREDUCE-1454. Quote user supplied strings in Tracker servlets. (cdouglas)
  1030. MAPREDUCE-1408. Add customizable job submission policies to Gridmix. (Rahul
  1031. Singh via cdouglas)
  1032. MAPREDUCE-1527. Better warning logged when mapred.queue.names is
  1033. overshadowed by mapred-queues.xml. (Hong Tang via acmurthy)
  1034. MAPREDUCE-1403. Save the size and number of distributed cache artifacts in
  1035. the configuration. (Arun Murthy via cdouglas)
  1036. MAPREDUCE-1482. Truncate state string and diagnostic information in
  1037. TaskStatus. (Amar Kamat via szetszwo)
  1038. MAPREDUCE-1593. [Rumen] Improvements to random seed generation (tamas via
  1039. mahadev)
  1040. MAPREDUCE-1460. Oracle support in DataDrivenDBInputFormat.
  1041. (Aaron Kimball via tomwhite)
  1042. MAPREDUCE-1569. Pass configuration through mocked contexts in MRUnit.
  1043. (Chris White via cdouglas)
  1044. MAPREDUCE-1590. Move HarFileSystem from Hadoop Common to Mapreduce tools.
  1045. (mahadev)
  1046. MAPREDUCE-1629. Get rid of fakeBlockLocations() on HarFileSystem, since
  1047. it's not used (mahadev)
  1048. MAPREDUCE-1489. DataDrivenDBInputFormat should not query the database
  1049. when generating only one split. (Aaron Kimball via tomwhite)
  1050. MAPREDUCE-1514. Add documentation on replication, permissions, new options,
  1051. limitations and internals of har. (mahadev via szetszwo)
  1052. MAPREDUCE-1428. Make block size and the size of archive created files
  1053. configurable. (mahadev via szetszwo)
  1054. MAPREDUCE-1656. JobStory should provide queue info. (hong via mahadev)
  1055. MAPREDUCE-1466. Record number of files processed in FileInputFormat in the
  1056. Configuration for offline analysis. (Luke Lu and Arun Murthy via cdouglas)
  1057. MAPREDUCE-1538. TrackerDistributedCacheManager manages the
  1058. number of files. (Scott Chen via dhruba)
  1059. MAPREDUCE-1673. Scripts to start and stop RaidNode.
  1060. (Rodrigo Schmidt via dhruba)
  1061. MAPREDUCE-1659. RaidNode writes temp files on configured tmp directory and
  1062. adds random numbers to their names to avoid conflicts
  1063. (Rodrigo Schmidt via dhruba)
  1064. MAPREDUCE-1221. Allow admins to control physical memory limits per-task
  1065. and per-node. (Scott Chen via acmurthy)
  1066. MAPREDUCE-1065. Update mapred tutorial to use the new API. (Aaron Kimball
  1067. via cdouglas)
  1068. MAPREDUCE-1304. Add a task counter tracking time spent in GC. (Aaron
  1069. Kimball via cdouglas)
  1070. MAPREDUCE-1570. Add grouping comparators to MRUnit. (Chris White via
  1071. cdouglas)
  1072. MAPREDUCE-1650. Exclude Private elements from generated MapReduce
  1073. Javadoc. (tomwhite)
  1074. MAPREDUCE-1625. Improve grouping of packages in Javadoc. (tomwhite)
  1075. MAPREDUCE-1417. Forrest documentation should be updated to reflect
  1076. the changes in MAPREDUCE-744. (Ravi Gummadi via vinodkv)
  1077. MAPREDUCE-1568. TrackerDistributedCacheManager should clean up cache
  1078. in a background thread. (Scott Chen via zshao)
  1079. MAPREDUCE-1749. Move configuration strings out of JobContext so that it
  1080. can be made public stable. (omalley)
  1081. MAPREDUCE-1623. Apply audience and stability notations to Hadoop
  1082. Map-Reduce. (tomwhite via acmurthy)
  1083. MAPREDUCE-1751. Change MapReduce to depend on Hadoop 'common' artifacts
  1084. instead of 'core'. (tomwhite)
  1085. MAPREDUCE-1535. Replace usage of FileStatus#isDir(). (Eli Collins via
  1086. tomwhite)
  1087. MAPREDUCE-1832. Allow file sizes less than 1MB in DFSIO benchmark. (shv)
  1088. MAPREDUCE-1404. Move Cluster-Setup and Single-Node-Setup Docs from
  1089. MapReduce to Common. (tomwhite)
  1090. MAPREDUCE-1697. Document the behavior of -file option and deprecate it
  1091. in favour of -files option in streaming. (Amareshwari Sriramadasu
  1092. via vinodkv)
  1093. MAPREDUCE-1033. Resolve location of scripts and configuration files after
  1094. project split. (tomwhite)
  1095. MAPREDUCE-1018. Document changes to the memory management and scheduling
  1096. model. (Hemanth Yamijala via vinodkv)
  1097. MAPREDUCE-1896. [Herriot] New property for multi user list. (Vinay Thota
  1098. via cos)
  1099. MAPREDUCE-1812. New properties for suspend and resume process. (Vinay
  1100. Thota via cos)
  1101. OPTIMIZATIONS
  1102. MAPREDUCE-270. Fix the tasktracker to optionally send an out-of-band
  1103. heartbeat on task-completion for better job-latency. (acmurthy)
  1104. Configuration changes:
  1105. add mapreduce.tasktracker.outofband.heartbeat
  1106. MAPREDUCE-1186. Modified code in distributed cache to set permissions
  1107. only on required set of localized paths.
  1108. (Amareshwari Sriramadasu via yhemanth)
  1109. MAPREDUCE-1501. FileInputFormat supports multi-level, recursive
  1110. directory listing. (Zheng Shao via dhruba)
  1111. MAPREDUCE-1556. upgrade to Avro 1.3.0. (cutting via tomwhite)
  1112. MAPREDUCE-1613. Install/deploy source jars to Maven repo
  1113. (Patrick Angeles via ddas)
  1114. MAPREDUCE-1610. Forrest documentation should be updated to reflect
  1115. the changes in MAPREDUCE-856. (Ravi Gummadi via vinodkv)
  1116. MAPREDUCE-1853. Adds caching for TaskAttemptContext in MultipleOutputs.
  1117. (Torsten Curdt via amareshwari)
  1118. BUG FIXES
  1119. MAPREDUCE-878. Rename fair scheduler design doc to
  1120. fair-scheduler-design-doc.tex and add Apache license header (matei)
  1121. HADOOP-4687. MapReduce is split from Hadoop Core. It is a subproject under
  1122. Hadoop (Owen O'Malley)
  1123. HADOOP-6096. Fix Eclipse project and classpath files following project
  1124. split. (tomwhite)
  1125. MAPREDUCE-419. Reconcile mapred.userlog.limit.kb defaults in configuration
  1126. and code. (Philip Zeyliger via cdouglas)
  1127. MAPREDUCE-2. Fixes a bug in KeyFieldBasedPartitioner in handling empty
  1128. keys. (Amar Kamat via sharad)
  1129. MAPREDUCE-130. Delete the jobconf copy from the log directory of the
  1130. JobTracker when the job is retired. (Amar Kamat via sharad)
  1131. MAPREDUCE-657. Fix hardcoded filesystem problem in CompletedJobStatusStore.
  1132. (Amar Kamat via sharad)
  1133. MAPREDUCE-179. Update progress in new RecordReaders. (cdouglas)
  1134. MAPREDUCE-658. Replace NPE in distcp with a meaningful error message when
  1135. the source path does not exist. (Ravi Gummadi via cdouglas)
  1136. MAPREDUCE-671. Update ignore list to include untracked, generated
  1137. build artifacts and config files. (cdouglas)
  1138. MAPREDUCE-433. Use more reliable counters in TestReduceFetch. (cdouglas)
  1139. MAPREDUCE-124. Fix a bug in failure handling of abort task of
  1140. OutputCommitter. (Amareshwari Sriramadasu via sharad)
  1141. MAPREDUCE-694. Fix to add jsp-api jars to capacity-scheduler classpath.
  1142. (Giridharan Kesavan)
  1143. MAPREDUCE-702. Fix eclipse-plugin jar target (Giridharan Kesavan)
  1144. MAPREDUCE-522. Replace TestQueueCapacities with simpler test case to
  1145. test integration between capacity scheduler and MR framework.
  1146. (Sreekanth Ramakrishnan via yhemanth)
  1147. MAPREDUCE-683. Fixes an initialization problem in the JobHistory.
  1148. The initialization of JobHistoryFilesManager is now done in the
  1149. JobHistory.init call. (Amar Kamat via ddas)
  1150. MAPREDUCE-708. Fixes a bug to allow updating the reason for
  1151. blacklisting a node on the JobTracker UI.
  1152. (Sreekanth Ramakrishnan via yhemanth)
  1153. MAPREDUCE-709. Fixes message displayed for a blacklisted node where
  1154. the reason for blacklisting is due to the health check script
  1155. timing out. (Sreekanth Ramakrishnan via yhemanth)
  1156. MAPREDUCE-676. Existing diagnostic rules fail for MAP ONLY jobs.
  1157. (Suhas Gogate via tomwhite)
  1158. MAPREDUCE-722. Fixes a bug with tasktracker reservations for
  1159. high memory jobs in capacity scheduler.
  1160. (Vinod Kumar Vavilapalli via yhemanth)
  1161. HADOOP-6090. Updates gridmix script to use new mapreduce api output
  1162. format. (Amareshwari Sriramadasu via sharad)
  1163. MAPREDUCE-732. Removed spurious log statements in the node
  1164. blacklisting logic. (Sreekanth Ramakrishnan via yhemanth)
  1165. MAPREDUCE-734. Fix a ConcurrentModificationException in unreserving
  1166. unused reservations for a job when it completes.
  1167. (Arun Murthy and Sreekanth Ramakrishnan via yhemanth)
  1168. MAPREDUCE-733. Fix a RuntimeException while unreserving trackers
  1169. that are blacklisted for a job.
  1170. (Arun Murthy and Sreekanth Ramakrishnan via yhemanth)
  1171. MAPREDUCE-677. Fix timeout in TestNodeRefresh. (Amar Kamat via
  1172. sharad)
  1173. MAPREDUCE-153. Fix timeout in TestJobInProgressListener. (Amar
  1174. Kamat via sharad)
  1175. MAPREDUCE-742. Fix output messages and java comments in the Pi related
  1176. examples. (szetszwo)
  1177. MAPREDUCE-565. Fix partitioner to work with new API. (Owen O'Malley via
  1178. cdouglas)
  1179. MAPREDUCE-680. Fix so MRUnit can handle reuse of Writable objects.
  1180. (Aaron Kimball via johan)
  1181. MAPREDUCE-18. Puts some checks for cross checking whether a reduce
  1182. task gets the correct shuffle data. (Ravi Gummadi via ddas)
  1183. MAPREDUCE-771. Fix scheduling of setup and cleanup tasks to use
  1184. free slots instead of tasks for scheduling. (yhemanth)
  1185. MAPREDUCE-717. Fixes some corner case issues in speculative
  1186. execution heuristics. (Devaraj Das)
  1187. MAPREDUCE-716. Make DBInputFormat work with Oracle. (Aaron Kimball
  1188. via tomwhite)
  1189. MAPREDUCE-735. Fixes a problem in the KeyFieldHelper to do with
  1190. the end index for some inputs (Amar Kamat via ddas)
  1191. MAPREDUCE-682. Removes reservations on tasktrackers which are
  1192. blacklisted. (Sreekanth Ramakrishnan via yhemanth)
  1193. MAPREDUCE-743. Fixes a problem to do with progress reporting
  1194. in the map phase. (Ravi Gummadi via ddas)
  1195. MAPREDUCE-765. Eliminate the deprecated warnings introduced by H-5438.
  1196. (He Yongqiang via szetszwo)
  1197. MAPREDUCE-383. Fix a bug in Pipes combiner due to bytes count not
  1198. getting reset after the spill. (Christian Kunz via sharad)
  1199. MAPREDUCE-809. Fix job-summary logs to correctly record status of FAILED
  1200. and KILLED jobs. (acmurthy)
  1201. MAPREDUCE-792. Fix unchecked warnings in DBInputFormat. (Aaron Kimball
  1202. via szetszwo)
  1203. MAPREDUCE-760. Fix a timing issue in TestNodeRefresh. (Amar Kamat via
  1204. sharad)
  1205. MAPREDUCE-40. Keep memory management backwards compatible for job
  1206. configuration parameters and limits. (Rahul Kumar Singh via yhemanth)
  1207. MAPREDUCE-587. Fixes an OOM issue in TestStreamingExitStatus.
  1208. (Amar Kamat via ddas)
  1209. MAPREDUCE-408. Fixes an assertion problem in TestKillSubProcesses
  1210. (Ravi Gummadi via ddas)
  1211. MAPREDUCE-659. Fix gridmix2 compilation. (Giridharan Kesavan)
  1212. MAPREDUCE-796. Fixes a ClassCastException in an exception log in
  1213. MultiThreadedMapRunner. (Amar Kamat via ddas)
  1214. MAPREDUCE-808. Fixes a serialization problem in TypedBytes.
  1215. (Klaas Bosteels via ddas)
  1216. MAPREDUCE-845. Fix a findbugs heap size problem in build.xml and add
  1217. a new property findbugs.heap.size. (Lee Tucker via szetszwo)
  1218. MAPREDUCE-838. Fixes a problem in the way commit of task outputs
  1219. happens. The bug was that even if commit failed, the task would
  1220. be declared as successful. (Amareshwari Sriramadasu via ddas)
  1221. MAPREDUCE-813. Updates Streaming and M/R tutorial documents.
  1222. (Corinne Chandel via ddas)
  1223. MAPREDUCE-805. Fixes some deadlocks in the JobTracker due to the fact
  1224. the JobTracker lock hierarchy wasn't maintained in some JobInProgress
  1225. method calls. (Amar Kamat via ddas)
  1226. MAPREDUCE-799. Fixes so all of the MRUnit self-tests run.
  1227. (Aaron Kimball via johan)
  1228. MAPREDUCE-848. Fixes a problem to do with TestCapacityScheduler
  1229. failing (Amar Kamat via ddas)
  1230. MAPREDUCE-840. DBInputFormat leaves open transaction.
  1231. (Aaron Kimball via tomwhite)
  1232. MAPREDUCE-859. Adds Avro and its dependencies required by Hadoop
  1233. common. (Ravi Gummadi via sharad)
  1234. MAPREDUCE-867. Fix ivy conf to look for avro jar from maven repo.
  1235. (Giridharan Kesavan)
  1236. MAPREDUCE-877. Added avro as a dependency to contrib ivy settings.
  1237. (Tsz Wo (Nicholas) Sze via yhemanth)
  1238. MAPREDUCE-852. In build.xml, remove the Main-Class, which is incorrectly
  1239. set in tools, and rename the target "tools-jar" to "tools". (szetszwo)
  1240. MAPREDUCE-773. Sends progress reports for compressed gzip inputs in maps.
  1241. Fixes a native direct buffer leak in LineRecordReader classes.
  1242. (Hong Tang and ddas)
  1243. MAPREDUCE-832. Reduce number of warning messages printed when
  1244. deprecated memory variables are used. (Rahul Kumar Singh via yhemanth)
  1245. MAPREDUCE-745. Fixes a testcase problem to do with generation of JobTracker
  1246. IDs. (Amar Kamat via ddas)
  1247. MAPREDUCE-834. Enables memory management on tasktrackers when old
  1248. memory management parameters are used in configuration.
  1249. (Sreekanth Ramakrishnan via yhemanth)
  1250. MAPREDUCE-818. Fixes Counters#getGroup API. (Amareshwari Sriramadasu
  1251. via sharad)
  1252. MAPREDUCE-807. Handles the AccessControlException during the deletion of
  1253. mapred.system.dir in the JobTracker. The JobTracker will bail out if it
  1254. encounters such an exception. (Amar Kamat via ddas)
  1255. MAPREDUCE-430. Fix a bug related to task getting stuck in case of
  1256. OOM error. (Amar Kamat via ddas)
  1257. MAPREDUCE-871. Fix ownership of Job/Task local files to have correct
  1258. group ownership according to the egid of the tasktracker.
  1259. (Vinod Kumar Vavilapalli via yhemanth)
  1260. MAPREDUCE-911. Fix a bug in TestTaskFail related to speculative
  1261. execution. (Amareshwari Sriramadasu via sharad)
  1262. MAPREDUCE-687. Fix an assertion in TestMiniMRMapRedDebugScript.
  1263. (Amareshwari Sriramadasu via sharad)
  1264. MAPREDUCE-924. Fixes the TestPipes testcase to use Tool.
  1265. (Amareshwari Sriramadasu via sharad)
  1266. MAPREDUCE-903. Add Avro jar to eclipse classpath.
  1267. (Philip Zeyliger via tomwhite)
  1268. MAPREDUCE-943. Removes a testcase in TestNodeRefresh that doesn't make
  1269. sense in the new Job recovery model. (Amar Kamat via ddas)
  1270. MAPREDUCE-764. TypedBytesInput's readRaw() does not preserve custom type
  1271. codes. (Klaas Bosteels via tomwhite)
  1272. HADOOP-6243. Fixes a NullPointerException in handling deprecated keys.
  1273. (Sreekanth Ramakrishnan via yhemanth)
  1274. MAPREDUCE-968. NPE in distcp encountered when placing _logs directory on
  1275. S3FileSystem. (Aaron Kimball via tomwhite)
  1276. MAPREDUCE-826. harchive doesn't use ToolRunner / harchive returns 0 even
  1277. if the job fails with exception (koji Noguchi via mahadev)
  1278. MAPREDUCE-839. unit test TestMiniMRChildTask fails on mac os-x (hong tang
  1279. via mahadev)
  1280. MAPREDUCE-112. Add counters for reduce input, output records to the new API.
  1281. (Jothi Padmanabhan via cdouglas)
  1282. MAPREDUCE-648. Fix two distcp bugs: (1) it should not launch a job if all
  1283. src paths are directories, and (2) it does not skip copying when updating
  1284. a single file. (Ravi Gummadi via szetszwo)
  1285. MAPREDUCE-946. Fix a regression in LineRecordReader where the
  1286. maxBytesToConsume parameter is not set correctly. (cdouglas)
  1287. MAPREDUCE-977. Missing jackson jars from Eclipse template. (tomwhite)
  1288. MAPREDUCE-988. Fix a packaging issue in the contrib modules. (Hong Tang via
  1289. cdouglas)
  1290. MAPREDUCE-971. distcp does not always remove distcp.tmp.dir. (Aaron Kimball
  1291. via tomwhite)
  1292. MAPREDUCE-995. Fix a bug in JobHistory where tasks completing after the job
  1293. is closed cause a NPE. (Jothi Padmanabhan via cdouglas)
  1294. MAPREDUCE-953. Fix QueueManager to dump queue configuration in JSON format.
  1295. (V.V. Chaitanya Krishna via yhemanth)
  1296. MAPREDUCE-645. Prevent distcp from running a job when the destination is a
  1297. file, but the source is not. (Ravi Gummadi via cdouglas)
  1298. MAPREDUCE-1002. Flushed writer in JobQueueClient so queue information is
  1299. printed correctly. (V.V. Chaitanya Krishna via yhemanth)
  1300. MAPREDUCE-1003. Fix compilation problem in eclipse plugin when
  1301. eclipse.home is set. (Ravi Gummadi via yhemanth)
  1302. MAPREDUCE-941. Vaidya script fails on Solaris. (Chad Metcalf
  1303. via tomwhite)
  1304. MAPREDUCE-912. Add and standardize Apache license headers. (Chad Metcalf
  1305. via cdouglas)
  1306. MAPREDUCE-1022. Fix compilation of vertica testcases. (Vinod Kumar
  1307. Vavilapalli via acmurthy)
  1308. MAPREDUCE-1000. Handle corrupt history files in JobHistory.initDone().
  1309. (Jothi Padmanabhan via sharad)
  1310. MAPREDUCE-1028. Fixed number of slots occupied by cleanup tasks to one
  1311. irrespective of slot size for the job.
  1312. (Ravi Gummadi via yhemanth)
  1313. MAPREDUCE-964. Fixed start and finish times of TaskStatus to be
  1314. consistent, thereby fixing inconsistencies in metering tasks.
  1315. (Sreekanth Ramakrishnan via yhemanth)
  1316. MAPREDUCE-1076. Deprecate ClusterStatus and add javadoc in ClusterMetrics.
  1317. (Amareshwari Sriramadasu via sharad)
  1318. MAPREDUCE-979. Fixed JobConf APIs related to memory parameters to return
  1319. values of new configuration variables when deprecated variables are
  1320. disabled. (Sreekanth Ramakrishnan via yhemanth)
  1321. MAPREDUCE-1030. Modified scheduling algorithm to return a map and reduce
  1322. task per heartbeat in the capacity scheduler.
  1323. (Rahul Kumar Singh via yhemanth)
  1324. MAPREDUCE-1071. Use DataInputStream rather than FSDataInputStream in the
  1325. JobHistory EventReader. (Hong Tang via cdouglas)
  1326. MAPREDUCE-986. Fix Rumen to work with truncated task lines. (Dick King via
  1327. cdouglas)
  1328. MAPREDUCE-1029. Fix failing TestCopyFiles by restoring the unzipping of
  1329. HDFS webapps from the hdfs jar. (Aaron Kimball and Jothi Padmanabhan via
  1330. cdouglas)
  1331. MAPREDUCE-769. Make findbugs and javac warnings to zero.
  1332. (Amareshwari Sriramadasu via sharad)
  1333. MAPREDUCE-1104. Initialize RecoveryManager in JobTracker cstr called by
  1334. Mumak. (Hong Tang via cdouglas)
  1335. MAPREDUCE-1061. Add unit test validating byte specifications for gridmix
  1336. jobs. (cdouglas)
  1337. MAPREDUCE-1077. Fix Rumen so that truncated tasks do not mark the job as
  1338. successful. (Dick King via cdouglas)
  1339. MAPREDUCE-1041. Make TaskInProgress::taskStatuses map package-private.
  1340. (Jothi Padmanabhan via cdouglas)
  1341. MAPREDUCE-1070. Prevent a deadlock in the fair scheduler servlet.
  1342. (Todd Lipcon via cdouglas)
  1343. MAPREDUCE-1086. Setup Hadoop logging environment for tasks to point to
  1344. task related parameters. (Ravi Gummadi via yhemanth)
  1345. MAPREDUCE-1105. Remove max limit configuration in capacity scheduler in
  1346. favor of max capacity percentage thus allowing the limit to go over
  1347. queue capacity. (Rahul Kumar Singh via yhemanth)
  1348. MAPREDUCE-1016. Make the job history log format JSON. (cutting)
  1349. MAPREDUCE-1038. Weave Mumak aspects only if related files have changed.
  1350. (Aaron Kimball via cdouglas)
  1351. MAPREDUCE-1163. Remove unused, hard-coded paths from libhdfs. (Allen
  1352. Wittenauer via cdouglas)
  1353. MAPREDUCE-962. Fix a NullPointerException while killing task process
  1354. trees. (Ravi Gummadi via yhemanth)
  1355. MAPREDUCE-1177. Correct setup/cleanup inversion in
  1356. JobTracker::getTaskReports. (Vinod Kumar Vavilapalli via cdouglas)
  1357. MAPREDUCE-1178. Fix ClassCastException in MultipleInputs by adding
  1358. a DelegatingRecordReader. (Amareshwari Sriramadasu and Jay Booth
  1359. via sharad)
  1360. MAPREDUCE-1068. Fix streaming job to show proper message if file is
  1361. not present. (Amareshwari Sriramadasu via sharad)
  1362. MAPREDUCE-1147. Add map output counters to new API. (Amar Kamat via
  1363. cdouglas)
  1364. MAPREDUCE-915. The debug scripts are run as the job user. (ddas)
  1365. MAPREDUCE-1007. Fix NPE in CapacityTaskScheduler.getJobs().
  1366. (V.V.Chaitanya Krishna via sharad)
  1367. MAPREDUCE-28. Refactor TestQueueManager and fix default ACLs.
  1368. (V.V.Chaitanya Krishna and Rahul K Singh via sharad)
  1369. MAPREDUCE-1182. Fix overflow in reduce causing allocations to exceed the
  1370. configured threshold. (cdouglas)
  1371. MAPREDUCE-1239. Fix contrib components build dependencies.
  1372. (Giridharan Kesavan and omalley)
  1373. MAPREDUCE-787. Fix JobSubmitter to honor user given symlink path.
  1374. (Amareshwari Sriramadasu via sharad)
  1375. MAPREDUCE-1249. Update config default value for socket read timeout to
  1376. match code default. (Amareshwari Sriramadasu via cdouglas)
  1377. MAPREDUCE-1161. Remove ineffective synchronization in NotificationTestCase.
  1378. (Owen O'Malley via cdouglas)
  1379. MAPREDUCE-1244. Fix eclipse-plugin's build dependencies. (gkesavan)
  1380. MAPREDUCE-1075. Fix JobTracker to not throw an NPE for a non-existent
  1381. queue. (V.V.Chaitanya Krishna via yhemanth)
  1382. MAPREDUCE-754. Fix NPE in expiry thread when a TT is lost. (Amar Kamat
  1383. via sharad)
  1384. MAPREDUCE-1074. Document Reducer mark/reset functionality. (Jothi
  1385. Padmanabhan via cdouglas)
  1386. MAPREDUCE-1267. Fix typo in mapred-default.xml. (Todd Lipcon via cdouglas)
  1387. MAPREDUCE-952. Remove inadvertently reintroduced Task.Counter enum. (Jothi
  1388. Padmanabhan via cdouglas)
  1389. MAPREDUCE-1230. Fix handling of null records in VerticaInputFormat. (Omer
  1390. Trajman via cdouglas)
  1391. MAPREDUCE-1171. Allow shuffle retries and read-error reporting to be
  1392. configurable. (Amareshwari Sriramadasu via acmurthy)
  1393. MAPREDUCE-879. Fix broken unit test TestTaskTrackerLocalization on MacOS.
  1394. (Sreekanth Ramakrishnan via yhemanth)
  1395. MAPREDUCE-1124. Fix imprecise byte counts in Gridmix. (cdouglas)
  1396. MAPREDUCE-1222. Add an option to exclude numeric IP addresses in topologies
  1397. processed by Mumak. (Hong Tang via cdouglas)
  1398. MAPREDUCE-1284. Fix fts_open() call in task-controller that was failing
  1399. LinuxTaskController unit tests. (Ravi Gummadi via yhemanth)
  1400. MAPREDUCE-1143. Fix running task counters to be updated correctly
  1401. when speculative attempts are running for a TIP.
  1402. (Rahul Kumar Singh via yhemanth)
  1403. MAPREDUCE-1241. Use a default queue configuration in JobTracker when
  1404. mapred-queues.xml is unavailable. (Todd Lipcon via cdouglas)
  1405. MAPREDUCE-1301. Fix set up of permission checking script used in
  1406. localization tests. (Amareshwari Sriramadasu via yhemanth)
  1407. MAPREDUCE-1286. Remove quoting from client opts in TaskRunner. (Yuri
  1408. Pradkin via cdouglas)
  1409. MAPREDUCE-1059. Use distcp.bytes.per.map when adding sync markers in
  1410. distcp. (Aaron Kimball via cdouglas)
  1411. MAPREDUCE-1009. Update forrest documentation describing hierarchical
  1412. queues. (Vinod Kumar Vavilapalli via yhemanth)
  1413. MAPREDUCE-1342. Fixed deadlock in global blacklisting of tasktrackers.
  1414. (Amareshwari Sriramadasu via acmurthy)
  1415. MAPREDUCE-1316. Fixes a memory leak of TaskInProgress instances in
  1416. the jobtracker. (Amar Kamat via yhemanth)
  1417. MAPREDUCE-1359. TypedBytes TestIO doesn't mkdir its test dir first.
  1418. (Anatoli Fomenko via cos)
  1419. MAPREDUCE-1314. Correct errant mapreduce.x.mapreduce.x replacements from
  1420. bulk change. (Amareshwari Sriramadasu via cdouglas)
  1421. MAPREDUCE-1365. Restore accidentally renamed test in
  1422. TestTaskTrackerBlacklisting. (Amareshwari Sriramadasu via cdouglas)
  1423. MAPREDUCE-1406. Fix spelling of JobContext.MAP_COMBINE_MIN_SPILLS.
  1424. (cdouglas)
  1425. MAPREDUCE-1369. JUnit tests should never depend on anything in conf
  1426. (Anatoli Fomenko via cos)
  1427. MAPREDUCE-1412. Fix timer granularity issue causing failures in
  1428. TestTaskTrackerBlacklisting. (cdouglas)
  1429. MAPREDUCE-1448. Respect --config option in Mumak script. (Hong Tang via
  1430. cdouglas)
  1431. MAPREDUCE-1251. c++ utils doesn't compile. (Eli Collins via tomwhite)
  1432. MAPREDUCE-1522. FileInputFormat may use the default FileSystem for the
  1433. input path. (Tsz Wo (Nicholas), SZE via cdouglas)
  1434. MAPREDUCE-1407. Update javadoc in mapreduce.{Mapper,Reducer} to match
  1435. actual usage. (Benoit Sigoure via cdouglas)
  1436. MAPREDUCE-1258. Fix fair scheduler event log not logging job info.
  1437. (matei)
  1438. MAPREDUCE-1089. Fix NPE in fair scheduler preemption when tasks are
  1439. scheduled but not running. (Todd Lipcon via matei)
  1440. MAPREDUCE-1014. Fix the libraries for common and hdfs. (omalley)
  1441. MAPREDUCE-1111. JT Jetty UI not working if we run mumak.sh
  1442. off packaged distribution directory. (hong tang via mahadev)
  1443. MAPREDUCE-1133. Eclipse .classpath template has outdated jar files and is
  1444. missing some new ones. (cos)
  1445. MAPREDUCE-1098. Fixed the distributed-cache to not do i/o while holding a
  1446. global lock. (Amareshwari Sriramadasu via acmurthy)
  1447. MAPREDUCE-1158. Fix JT running maps and running reduces metrics.
  1448. (sharad)
  1449. MAPREDUCE-1160. Reduce verbosity of log lines in some Map/Reduce classes
  1450. to avoid filling up jobtracker logs on a busy cluster.
  1451. (Ravi Gummadi and Hong Tang via yhemanth)
  1452. MAPREDUCE-1153. Fix tasktracker metrics when trackers are decommissioned.
  1453. (sharad)
  1454. MAPREDUCE-1128. Fix MRUnit to prohibit iterating over values twice. (Aaron
  1455. Kimball via cdouglas)
  1456. MAPREDUCE-665. Move libhdfs to HDFS subproject. (Eli Collins via dhruba)
  1457. MAPREDUCE-1196. Fix FileOutputCommitter to use the deprecated cleanupJob
  1458. api correctly. (acmurthy)
  1459. MAPREDUCE-1244. Fix eclipse-plugin's build dependencies. (gkesavan)
  1460. MAPREDUCE-1140. Fix DistributedCache to not decrement reference counts for
  1461. unreferenced files in error conditions.
  1462. (Amareshwari Sriramadasu via yhemanth)
  1463. MAPREDUCE-1245. Fix TestFairScheduler failures by instantiating lightweight
  1464. Jobtracker. (sharad)
  1465. MAPREDUCE-1260. Update Eclipse configuration to match changes to Ivy
  1466. configuration. (Edwin Chan via cos)
  1467. MAPREDUCE-1152. Distinguish between failed and killed tasks in
  1468. JobTrackerInstrumentation. (Sharad Agarwal via cdouglas)
  1469. MAPREDUCE-1285. In DistCp.deleteNonexisting(..), get class from the
  1470. parameter instead of using FileStatus.class. (Peter Romianowski via
  1471. szetszwo)
  1472. MAPREDUCE-1294. Build fails to pull latest hadoop-core-* artifacts (cos)
  1473. MAPREDUCE-1213. TaskTrackers restart is faster because it deletes
  1474. distributed cache directory asynchronously. (Zheng Shao via dhruba)
  1475. MAPREDUCE-1265. The task attempt error log prints the name of the
  1476. tasktracker machine. (Scott Chen via dhruba)
  1477. MAPREDUCE-1201. ProcfsBasedProcessTree collects CPU usage information.
  1478. (Scott Chen via dhruba)
  1479. MAPREDUCE-1326. fi tests don't use fi-site.xml (cos)
  1480. MAPREDUCE-1165. Replace non-portable function name with C99 equivalent.
  1481. (Allen Wittenauer via cdouglas)
  1482. MAPREDUCE-1331. Fixes a typo in a testcase (Devaraj Das)
  1483. MAPREDUCE-1293. AutoInputFormat doesn't work with non-default FileSystems.
  1484. (Andrew Hitchcock via tomwhite)
  1485. MAPREDUCE-1131. Using profilers other than hprof can cause JobClient to
  1486. report job failure. (Aaron Kimball via tomwhite)
  1487. MAPREDUCE-1155. Streaming tests swallow exceptions.
  1488. (Todd Lipcon via tomwhite)
  1489. MAPREDUCE-1212. Mapreduce contrib project ivy dependencies are not included
  1490. in binary target. (Aaron Kimball via tomwhite)
  1491. MAPREDUCE-1388. Move the HDFS RAID package from HDFS to MAPREDUCE.
  1492. (Eli Collins via dhruba)
  1493. MAPREDUCE-1322. Defines default value for staging directory to be user
  1494. based fixing a failing streaming test.
  1495. (Devaraj Das and Amareshwari Sriramadasu via yhemanth)
  1496. MAPREDUCE-899. Modified LinuxTaskController to check that task-controller
  1497. has right permissions and ownership before performing any actions.
  1498. (Amareshwari Sriramadasu via yhemanth)
  1499. MAPREDUCE-1443. DBInputFormat can leak connections.
  1500. (Aaron Kimball via tomwhite)
  1501. MAPREDUCE-1457. Fixes JobTracker to get the FileSystem object within
  1502. getStagingAreaDir within a privileged block. Fixes Child.java to use the
  1503. appropriate UGIs while getting the TaskUmbilicalProtocol proxy and
  1504. while executing the task. (Jakob Homan via ddas)
  1505. MAPREDUCE-1399. The archive command shows a null error message (nicholas
  1506. via mahadev)
  1507. MAPREDUCE-1305. Improve efficiency of distcp -delete. (Peter Romianowski
  1508. via cdouglas)
  1509. MAPREDUCE-1474. Update forrest documentation for Hadoop Archives. (Mahadev
  1510. Konar via cdouglas)
  1511. MAPREDUCE-1400. Use tr rather than sed to effect literal substitution in
  1512. the build script. (Allen Wittenauer via cdouglas)
  1513. MAPREDUCE-1358. Avoid false positives in OutputLogFilter. (Todd Lipcon via
  1514. cdouglas)
  1515. MAPREDUCE-1490. Fix a NullPointerException that could occur during
  1516. instantiation and initialization of the DistributedRaidFileSystem.
  1517. (Rodrigo Schmidt via dhruba)
  1518. MAPREDUCE-1476. Fix the M/R framework to not call commit for special
  1519. tasks like job setup/cleanup and task cleanup.
  1520. (Amareshwari Sriramadasu via yhemanth)
  1521. MAPREDUCE-1398. Fix TaskLauncher to stop waiting for slots on a TIP that
  1522. is killed / failed.
  1523. (Amareshwari Sriramadasu via yhemanth)
  1524. MAPREDUCE-1491. The parity files created by the RAID are combined
  1525. using Hadoop Archive Files (HAR). (Rodrigo Schmidt via dhruba)
  1526. MAPREDUCE-1378. URL encode link in jobhistory.jsp to avoid errors caused by
  1527. unescaped characters. (E. Sammer via cdouglas)
  1528. MAPREDUCE-1519. RaidNode fails to create new parity file
  1529. if an older version already exists. (Rodrigo Schmidt via dhruba)
  1530. MAPREDUCE-1537. Fixes a compilation problem in a testcase after commit
  1531. HDFS-984. (Jitendra Nath Pandey via ddas)
  1532. MAPREDUCE-1537. The patch makes the job client call the getDelegationToken
  1533. only when security is enabled. (Jitendra Nath Pandey via ddas)
  1534. MAPREDUCE-1510. RAID should regenerate parity files if they get deleted.
  1535. (Rodrigo Schmidt via dhruba)
  1536. MAPREDUCE-1421. Fix the LinuxTaskController tests failing on trunk after
  1537. the commit of MAPREDUCE-1385. (Amareshwari Sriramadasu via vinodkv)
  1538. MAPREDUCE-1520. Fix TestMiniMRLocalFS failure caused by regression in
  1539. getting user working dir. (Amareshwari Sriramadasu via cdouglas)
  1540. MAPREDUCE-1512. RAID uses HarFileSystem directly instead of
  1541. FileSystem.get (Rodrigo Schmidt via dhruba)
  1542. MAPREDUCE-1435. Fix symlink handling in task work directory when
  1543. cleaning up, essentially to avoid following links.
  1544. (Ravi Gummadi via yhemanth)
  1545. MAPREDUCE-1518. RaidNode does not run the deletion check on the
  1546. directory that stores the parity files. (Rodrigo Schmidt via dhruba)
  1547. MAPREDUCE-1573. TestStreamingAsDifferentUser fails if run as tt_user.
  1548. (Ravi Gummadi via vinodkv)
  1549. MAPREDUCE-927. Cleanup of task-logs should happen in TaskTracker instead
  1550. of the Child. (Amareshwari Sriramadasu via vinodkv)
  1551. MAPREDUCE-1578. Decouple HadoopArchives version from HarFileSystem version.
  1552. (Rodrigo Schmidt via szetszwo)
  1553. MAPREDUCE-1422. Fix cleanup of localized job directory to work if files
  1554. with non-deletable permissions are created within it.
  1555. (Amar Kamat via yhemanth)
  1556. MAPREDUCE-1306. Randomize the arrival of heartbeat responses in Mumak.
  1557. (Tamas Sarlos via cdouglas)
  1558. MAPREDUCE-1579. archive: check and possibly replace the space character
  1559. in source paths. (szetszwo)
  1560. MAPREDUCE-1536. DataDrivenDBInputFormat does not split date columns correctly.
  1561. (Aaron Kimball via enis)
  1562. MAPREDUCE-890. After HADOOP-4491, the user who started mapred system is
  1563. not able to run job. (Ravi Gummadi via vinodkv)
  1564. MAPREDUCE-1615. Fix compilation of TestSubmitJob. (cdouglas)
  1565. MAPREDUCE-1508. Protect against NPE in TestMultipleLevelCaching. (Aaron
  1566. Kimball via cdouglas)
  1567. MAPREDUCE-1497. Suppress spurious findbugs warning about IndexCache
  1568. synchronization. (Amareshwari Sriramadasu via cdouglas)
  1569. MAPREDUCE-1420. Fix TestTTResourceReporting failure. (Scott Chen via
  1570. cdouglas)
  1571. MAPREDUCE-1480. Correctly initialize child RecordReaders in
  1572. CombineFileInputFormat. (Aaron Kimball via cdouglas)
  1573. MAPREDUCE-1348. Fix block forensics packaging. (Tom White via cdouglas)
  1574. MAPREDUCE-1628. HarFileSystem shows incorrect replication numbers and
  1575. permissions. (szetszwo via mahadev)
  1576. MAPREDUCE-1602. Fix the error message for the case that src does not
  1577. exist. (szetszwo)
  1578. MAPREDUCE-1585. Create Hadoop Archives version 2 with filenames
  1579. URL-encoded (rodrigo via mahadev)
  1580. MAPREDUCE-1523. Sometimes rumen trace generator fails to extract the job
  1581. finish time. (dick king via mahadev)
  1582. MAPREDUCE-1635. ResourceEstimator does not work after MAPREDUCE-842.
  1583. (Amareshwari Sriramadasu via vinodkv)
  1584. MAPREDUCE-889. binary communication formats added to Streaming by
  1585. HADOOP-1722 should be documented. (Klaas Bosteels via tomwhite)
  1586. MAPREDUCE-1031. ant tar target doesn't seem to compile tests in contrib
  1587. projects. (Aaron Kimball via tomwhite)
  1588. MAPREDUCE-1692. Removed unused testcase TestStreamedMerge.
  1589. (Sreekanth Ramakrishnan and Amareshwari Sriramadasu via yhemanth)
  1590. MAPREDUCE-1062. Fix ReliabilityTest to work with retired jobs. (Sreekanth
  1591. Ramakrishnan via cdouglas)
  1592. MAPREDUCE-1409. IOExceptions thrown from FileOutputCommitter::abortTask
  1593. should cause the task to fail. (Amareshwari Sriramadasu via cdouglas)
  1594. MAPREDUCE-1695. Include capacity scheduler in findbugs and javadoc-dev
  1595. targets and also fix existing warnings. (Hong Tang via yhemanth)
  1596. MAPREDUCE-1494. Ensure TestJobDirCleanup verifies the correct paths.
  1597. (Amareshwari Sriramadasu via cdouglas)
  1598. MAPREDUCE-1622. Include missing slf4j dependencies. (cdouglas)
  1599. MAPREDUCE-1515. Accept java5.home from build.properties, not only from the
  1600. command line when building forrest docs. (Al Thompson via cdouglas)
  1601. MAPREDUCE-1618. Add missing javadoc to JobStatus::*JobAcls. (Amareshwari
  1602. Sriramadasu via cdouglas)
  1603. MAPREDUCE-1219. Remove job level metrics from jobtracker metrics to ease
  1604. undue load on jobtracker. (Sreekanth Ramakrishnan via sharad)
  1605. MAPREDUCE-1604. Add Forrest documentation for Job ACLs.
  1606. (Amareshwari Sriramadasu via yhemanth)
  1607. MAPREDUCE-1705. Archiving and Purging of HDFS parity files should
  1608. handle globbed policies accurately. (Rodrigo Schmidt via dhruba)
  1609. MAPREDUCE-1612. job conf file is not accessible from job history web page.
  1610. (Ravi Gummadi and Sreekanth Ramakrishnan via vinodkv)
  1611. MAPREDUCE-1397. NullPointerException observed during task failures.
  1612. (Amareshwari Sriramadasu via vinodkv)
  1613. MAPREDUCE-1728. Oracle timezone strings do not match Java.
  1614. (Aaron Kimball via tomwhite)
  1615. MAPREDUCE-1609. TaskTracker.localizeJob should not set permissions on
  1616. job log directory recursively. (Amareshwari Sriramadasu via vinodkv)
  1617. MAPREDUCE-1657. After task logs directory is deleted, tasklog servlet
  1618. displays wrong error message about job ACLs. (Ravi Gummadi via vinodkv)
  1619. MAPREDUCE-1727. TestJobACLs fails after HADOOP-6686. (Ravi Gummadi via vinodkv)
  1620. MAPREDUCE-1611. Refresh nodes and refresh queues doesn't work with service
  1621. authorization enabled. (Amar Kamat via vinodkv)
  1622. MAPREDUCE-1276. Correct flaws in the shuffle related to connection setup
  1623. and failure attribution. (Amareshwari Sriramadasu via cdouglas)
  1624. MAPREDUCE-1372. ConcurrentModificationException in JobInProgress.
  1625. (Dick King and Amareshwari Sriramadasu via tomwhite)
  1626. MAPREDUCE-118. Fix Job.getJobID(). (Amareshwari Sriramadasu via sharad)
  1627. MAPREDUCE-913. TaskRunner crashes with NPE resulting in held up slots,
  1628. UNINITIALIZED tasks and hung TaskTracker. (Amareshwari Sriramadasu and
  1629. Sreekanth Ramakrishnan via vinodkv)
  1630. MAPREDUCE-1725. Fix MapReduce API incompatibilities between 0.20 and 0.21.
  1631. (tomwhite)
  1632. MAPREDUCE-1606. TestJobACLs may timeout as there are no slots for launching
  1633. JOB_CLEANUP task. (Ravi Gummadi via vinodkv)
  1634. MAPREDUCE-1765. Correct streaming documentation for StreamXmlRecordReader.
  1635. (Corinne Chandel via amareshwari)
  1636. MAPREDUCE-1880. Fix BigDecimal.divide(..) in the pi example. (szetszwo)
  1637. MAPREDUCE-1885. Revert FileSystem create method that takes CreateFlags
  1638. (MapReduce part of HADOOP-6826). (Ravi Gummadi via tomwhite)
  1639. MAPREDUCE-1870. Harmonize MapReduce JAR library versions with Common and
  1640. HDFS. (tomwhite)
  1641. MAPREDUCE-1791. Remote cluster control functionality needs JavaDocs
  1642. improvement (Konstantin Boudnik)
  1643. MAPREDUCE-1942. 'compile-fault-inject' should never be called directly.
  1644. (Konstantin Boudnik)
  1645. MAPREDUCE-1876. Fixes TaskAttemptStartedEvent to correctly log event type
  1646. for all task types. (Amar Kamat via amareshwari)
  1647. MAPREDUCE-1926. MapReduce distribution is missing build-utils.xml.
  1648. (tomwhite)
  1649. MAPREDUCE-2012. Some contrib tests fail in branch 0.21 and trunk.
  1650. (Amareshwari Sriramadasu via tomwhite)
  1651. MAPREDUCE-1980. Fixes TaskAttemptUnsuccessfulCompletionEvent and
  1652. TaskAttemptFinishedEvent to correctly log event type for all task types.
  1653. (Amar Kamat via amareshwari)
  1654. MAPREDUCE-1856. Extract a subset of tests for smoke (DOA) validation (cos)