12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
7477847794780478147824783478447854786478747884789479047914792479347944795479647974798479948004801480248034804480548064807480848094810481148124813481448154816481748184819482048214822482348244825482648274828482948304831483248334834483548364837483848394840484148424843484448454846484748484849485048514852485348544855485648574858485948604861486248634864486548664867486848694870487148724873487448754876487748784879488048814882488348844885488648874888488948904891489248934894489548964897489848994900490149024903490449054906490749084909491049114912491349144915491649174918491949204921492249234924492549264927492849294930493149324933493449354936493749384939494049414942494349444945494649474948494949504951495249534954495549564957495849594960496149624963 |
- <!--
- **********************************************************
- ** WARNING: This file is generated from CHANGES.txt by the
- ** Perl script 'changes2html.pl'.
- ** Do *not* edit this file!
- **********************************************************
-
- ****************************************************************************
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements. See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- ****************************************************************************
- -->
- <html>
- <head>
- <title>Hadoop Change Log</title>
- <link rel="stylesheet" href="ChangesFancyStyle.css" title="Fancy">
- <link rel="alternate stylesheet" href="ChangesSimpleStyle.css" title="Simple">
- <META http-equiv="Content-Type" content="text/html; charset=UTF-8"/>
- <SCRIPT>
- function toggleList(e) {
- element = document.getElementById(e).style;
- element.display == 'none' ? element.display = 'block' : element.display='none';
- }
- function collapse() {
- for (var i = 0; i < document.getElementsByTagName("ul").length; i++) {
- var list = document.getElementsByTagName("ul")[i];
- if (list.id != 'release_0.19.1_-_2009-02-23_' && list.id != 'release_0.19.0_-_2008-11-18_') {
- list.style.display = "none";
- }
- }
- for (var i = 0; i < document.getElementsByTagName("ol").length; i++) {
- document.getElementsByTagName("ol")[i].style.display = "none";
- }
- }
- // Run collapse() when the window's load event fires.
- window.onload = collapse;
- </SCRIPT>
- </head>
- <body>
- <a href="http://hadoop.apache.org/core/"><img class="logoImage" alt="Hadoop" src="images/hadoop-logo.jpg" title="Scalable Computing Platform"></a>
- <h1>Hadoop Change Log</h1>
- <h2><a href="javascript:toggleList('release_0.19.1_-_2009-02-23_')">Release 0.19.1 - 2009-02-23
- </a></h2>
- <ul id="release_0.19.1_-_2009-02-23_">
- <li><a href="javascript:toggleList('release_0.19.1_-_2009-02-23_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (2)
- <ol id="release_0.19.1_-_2009-02-23_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5225">HADOOP-5225</a>. Workaround for tmp file handling in HDFS. sync() is
- incomplete as a result. committed only to 0.19.x.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5224">HADOOP-5224</a>. HDFS append() is disabled. It throws
- UnsupportedOperationException. committed only to 0.19.x<br />(Raghu Angadi)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.19.1_-_2009-02-23_._improvements_')"> IMPROVEMENTS
- </a> (4)
- <ol id="release_0.19.1_-_2009-02-23_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4739">HADOOP-4739</a>. Fix spelling and grammar, improve phrasing of some sections in
- mapred tutorial.<br />(Vivek Ratan via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3894">HADOOP-3894</a>. DFSClient logging improvements.<br />(Steve Loughran via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5126">HADOOP-5126</a>. Remove empty file BlocksWithLocations.java<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5127">HADOOP-5127</a>. Remove public methods in FSDirectory.<br />(Jakob Homan via shv)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.19.1_-_2009-02-23_._bug_fixes_')"> BUG FIXES
- </a> (31)
- <ol id="release_0.19.1_-_2009-02-23_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4697">HADOOP-4697</a>. Fix getBlockLocations in KosmosFileSystem to handle multiple
- blocks correctly.<br />(Sriram Rao via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4420">HADOOP-4420</a>. Add null checks for job, caused by invalid job IDs.<br />(Aaron Kimball via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4632">HADOOP-4632</a>. Fix TestJobHistoryVersion to use test.build.dir instead of the
- current working directory for scratch space.<br />(Amar Kamat via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4508">HADOOP-4508</a>. Fix FSDataOutputStream.getPos() for append.<br />(dhruba via
- szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4727">HADOOP-4727</a>. Fix a group checking bug in fill_stat_structure(...) in
- fuse-dfs.<br />(Brian Bockelman via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4731">HADOOP-4731</a>. Fix capacity scheduler to correctly remove job on completion
- from waiting queue.<br />(Amar Kamat via yhemanth)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4836">HADOOP-4836</a>. Correct typos in mapred related documentation.<br />(Jordà Polo
- via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4821">HADOOP-4821</a>. Usage description in the Quotas guide documentations are
- incorrect.<br />(Boris Shkolnik via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4847">HADOOP-4847</a>. Moves the loading of OutputCommitter to the Task.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4966">HADOOP-4966</a>. Marks completed setup tasks for removal.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4992">HADOOP-4992</a>. Fixes a package name problem introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-4847">HADOOP-4847</a>.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4982">HADOOP-4982</a>. TestFsck should run in Eclipse.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5008">HADOOP-5008</a>. TestReplication#testPendingReplicationRetry leaves an opened
- fd unclosed.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4906">HADOOP-4906</a>. Fix TaskTracker OOM by keeping a shallow copy of JobConf in
- TaskTracker.TaskInProgress.<br />(Sharad Agarwal via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4918">HADOOP-4918</a>. Fix bzip2 compression to work with Sequence Files.
- (Zheng Shao via dhruba).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4965">HADOOP-4965</a>. TestFileAppend3 should close FileSystem.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4967">HADOOP-4967</a>. Fixes a race condition in the JvmManager to do with killing
- tasks.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5002">HADOOP-5002</a>. Fixes a problem to do with the order of initialization of
- reduce task and instantiating the reducer class.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5009">HADOOP-5009</a>. DataNode#shutdown sometimes leaves data block scanner
- verification log unclosed.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5086">HADOOP-5086</a>. Use the appropriate FileSystem for trash URIs.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4955">HADOOP-4955</a>. Make DBOutputFormat use column names from setOutput().<br />(Kevin Peterson via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4862">HADOOP-4862</a>. Minor : <a href="http://issues.apache.org/jira/browse/HADOOP-3678">HADOOP-3678</a> did not remove all the cases of
- spurious IOExceptions logged by DataNode.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5034">HADOOP-5034</a>. NameNode should send both replication and deletion requests
- to DataNode in one reply to a heartbeat.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5156">HADOOP-5156</a>. TestHeartbeatHandling uses MiniDFSCluster.getNamesystem()
- which does not exist in branch 0.19 and 0.20.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4759">HADOOP-4759</a>. Removes temporary output directory for failed and
- killed tasks by launching special CLEANUP tasks for the same.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5161">HADOOP-5161</a>. Accepted sockets do not get placed in
- DataXceiverServer#childSockets.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5193">HADOOP-5193</a>. Correct calculation of edits modification time.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4494">HADOOP-4494</a>. Allow libhdfs to append to files.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5166">HADOOP-5166</a>. Fix JobTracker restart to work when ACLs are configured
- for the JobTracker. (Amar Kamat via yhemanth).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5067">HADOOP-5067</a>. Fixes TaskInProgress.java to keep track of count of failed and
- killed tasks correctly.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4760">HADOOP-4760</a>. HDFS streams should not throw exceptions when closed twice.<br />(enis)</li>
- </ol>
- </li>
- </ul>
- <h2><a href="javascript:toggleList('release_0.19.0_-_2008-11-18_')">Release 0.19.0 - 2008-11-18
- </a></h2>
- <ul id="release_0.19.0_-_2008-11-18_">
- <li><a href="javascript:toggleList('release_0.19.0_-_2008-11-18_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (22)
- <ol id="release_0.19.0_-_2008-11-18_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3595">HADOOP-3595</a>. Remove deprecated methods for mapred.combine.once
- functionality, which was necessary for providing backwards
- compatible combiner semantics for 0.18.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3667">HADOOP-3667</a>. Remove the following deprecated methods from JobConf:
- addInputPath(Path)
- getInputPaths()
- getMapOutputCompressionType()
- getOutputPath()
- getSystemDir()
- setInputPath(Path)
- setMapOutputCompressionType(CompressionType style)
- setOutputPath(Path)<br />(Amareshwari Sriramadasu via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3652">HADOOP-3652</a>. Remove deprecated class OutputFormatBase.<br />(Amareshwari Sriramadasu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2885">HADOOP-2885</a>. Break the hadoop.dfs package into separate packages under
- hadoop.hdfs that reflect whether they are client, server, protocol,
- etc. DistributedFileSystem and DFSClient have moved and are now
- considered package private.<br />(Sanjay Radia via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2325">HADOOP-2325</a>. Require Java 6.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-372">HADOOP-372</a>. Add support for multiple input paths with a different
- InputFormat and Mapper for each path.<br />(Chris Smith via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1700">HADOOP-1700</a>. Support appending to file in HDFS.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3792">HADOOP-3792</a>. Make FsShell -test consistent with unix semantics, returning
- zero for true and non-zero for false.<br />(Ben Slusky via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3664">HADOOP-3664</a>. Remove the deprecated method InputFormat.validateInput,
- which is no longer needed.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3549">HADOOP-3549</a>. Give more meaningful errno's in libhdfs. In particular,
- EACCES is returned for permission problems.<br />(Ben Slusky via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4036">HADOOP-4036</a>. ResourceStatus was added to TaskTrackerStatus by <a href="http://issues.apache.org/jira/browse/HADOOP-3759">HADOOP-3759</a>,
- so increment the InterTrackerProtocol version.<br />(Hemanth Yamijala via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3150">HADOOP-3150</a>. Moves task promotion to tasks. Defines a new interface for
- committing output files. Moves job setup to jobclient, and moves jobcleanup
- to a separate task.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3446">HADOOP-3446</a>. Keep map outputs in memory during the reduce. Remove
- fs.inmemory.size.mb and replace with properties defining in memory map
- output retention during the shuffle and reduce relative to maximum heap
- usage.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3245">HADOOP-3245</a>. Adds the feature for supporting JobTracker restart. Running
- jobs can be recovered from the history file. The history file format has
- been modified to support recovery. The task attempt ID now has the
- JobTracker start time to distinguish attempts of the same TIP across
- restarts.<br />(Amar Ramesh Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4007">HADOOP-4007</a>. REMOVE DFSFileInfo - FileStatus is sufficient.<br />(Sanjay Radia via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3722">HADOOP-3722</a>. Fixed Hadoop Streaming and Hadoop Pipes to use the Tool
- interface and GenericOptionsParser.<br />(Enis Soztutar via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2816">HADOOP-2816</a>. Cluster summary at name node web reports the space
- utilization as:
- Configured Capacity: capacity of all the data directories - Reserved space
- Present Capacity: Space available for dfs, i.e. remaining+used space
- DFS Used%: DFS used space/Present Capacity<br />(Suresh Srinivas via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3938">HADOOP-3938</a>. Disk space quotas for HDFS. This is similar to namespace
- quotas in 0.18.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4293">HADOOP-4293</a>. Make Configuration Writable and remove unreleased
- WritableJobConf. Configuration.write is renamed to writeXml.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4281">HADOOP-4281</a>. Change dfsadmin to report available disk space in a format
- consistent with the web interface as defined in <a href="http://issues.apache.org/jira/browse/HADOOP-2816">HADOOP-2816</a>.<br />(Suresh
- Srinivas via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4430">HADOOP-4430</a>. Further change the cluster summary at name node web that was
- changed in <a href="http://issues.apache.org/jira/browse/HADOOP-2816">HADOOP-2816</a>:
- Non DFS Used - This indicates the disk space taken by non DFS file from
- the Configured capacity
- DFS Used % - DFS Used % of Configured Capacity
- DFS Remaining % - Remaining % Configured Capacity available for DFS use
- DFS command line report reflects the same change. Config parameter
- dfs.datanode.du.pct is no longer used and is removed from the
- hadoop-default.xml.<br />(Suresh Srinivas via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4116">HADOOP-4116</a>. Balancer should provide better resource management.<br />(hairong)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.19.0_-_2008-11-18_._new_features_')"> NEW FEATURES
- </a> (39)
- <ol id="release_0.19.0_-_2008-11-18_._new_features_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3341">HADOOP-3341</a>. Allow streaming jobs to specify the field separator for map
- and reduce input and output. The new configuration values are:
- stream.map.input.field.separator
- stream.map.output.field.separator
- stream.reduce.input.field.separator
- stream.reduce.output.field.separator
- All of them default to "\t".<br />(Zheng Shao via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3479">HADOOP-3479</a>. Defines the configuration file for the resource manager in
- Hadoop. You can configure various parameters related to scheduling, such
- as queues and queue properties here. The properties for a queue follow a
- naming convention, such as hadoop.rm.queue.queue-name.property-name.<br />(Hemanth Yamijala via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3149">HADOOP-3149</a>. Adds a way in which map/reduce tasks can create multiple
- outputs.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3714">HADOOP-3714</a>. Add a new contrib, bash-tab-completion, which enables
- bash tab completion for the bin/hadoop script. See the README file
- in the contrib directory for the installation.<br />(Chris Smith via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3730">HADOOP-3730</a>. Adds a new JobConf constructor that disables loading
- default configurations.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3772">HADOOP-3772</a>. Add a new Hadoop Instrumentation api for the JobTracker and
- the TaskTracker, refactor Hadoop Metrics as an implementation of the api.<br />(Ari Rabkin via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2302">HADOOP-2302</a>. Provides a comparator for numerical sorting of key fields.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-153">HADOOP-153</a>. Provides a way to skip bad records.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-657">HADOOP-657</a>. Free disk space should be modelled and used by the scheduler
- to make scheduling decisions.<br />(Ari Rabkin via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3719">HADOOP-3719</a>. Initial checkin of Chukwa, which is a data collection and
- analysis framework.<br />(Jerome Boulon, Andy Konwinski, Ari Rabkin,
- and Eric Yang)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3873">HADOOP-3873</a>. Add -filelimit and -sizelimit options to distcp to cap the
- number of files/bytes copied in a particular run to support incremental
- updates and mirroring. (TszWo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3585">HADOOP-3585</a>. FailMon package for hardware failure monitoring and
- analysis of anomalies.<br />(Ioannis Koltsidas via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1480">HADOOP-1480</a>. Add counters to the C++ Pipes API.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3854">HADOOP-3854</a>. Add support for pluggable servlet filters in the HttpServers.
- (Tsz Wo (Nicholas) Sze via omalley)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3759">HADOOP-3759</a>. Provides ability to run memory intensive jobs without
- affecting other running tasks on the nodes.<br />(Hemanth Yamijala via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3746">HADOOP-3746</a>. Add a fair share scheduler.<br />(Matei Zaharia via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3754">HADOOP-3754</a>. Add a thrift interface to access HDFS.<br />(dhruba via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3828">HADOOP-3828</a>. Provides a way to write skipped records to DFS.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3948">HADOOP-3948</a>. Separate name-node edits and fsimage directories.<br />(Lohit Vijayarenu via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3939">HADOOP-3939</a>. Add an option to DistCp to delete files at the destination
- not present at the source. (Tsz Wo (Nicholas) Sze via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3601">HADOOP-3601</a>. Add a new contrib module for Hive, which is a sql-like
- query processing tool that uses map/reduce.<br />(Ashish Thusoo via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3866">HADOOP-3866</a>. Added sort and multi-job updates in the JobTracker web ui.<br />(Craig Weisenfluh via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3698">HADOOP-3698</a>. Add access control to control who is allowed to submit or
- modify jobs in the JobTracker.<br />(Hemanth Yamijala via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1869">HADOOP-1869</a>. Support access times for HDFS files.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3941">HADOOP-3941</a>. Extend FileSystem API to return file-checksums.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3581">HADOOP-3581</a>. Prevents memory intensive user tasks from taking down
- nodes.<br />(Vinod K V via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3970">HADOOP-3970</a>. Provides a way to recover counters written to JobHistory.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3702">HADOOP-3702</a>. Adds ChainMapper and ChainReducer classes that allow composing
- chains of Maps and Reduces in a single Map/Reduce job, something like
- MAP+ / REDUCE MAP*.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3445">HADOOP-3445</a>. Add capacity scheduler that provides guaranteed capacities to
- queues as a percentage of the cluster.<br />(Vivek Ratan via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3992">HADOOP-3992</a>. Add a synthetic load generation facility to the test
- directory.<br />(hairong via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3981">HADOOP-3981</a>. Implement a distributed file checksum algorithm in HDFS
- and change DistCp to use file checksum for comparing src and dst files<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3829">HADOOP-3829</a>. Narrow down skipped records based on user acceptable value.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3930">HADOOP-3930</a>. Add common interfaces for the pluggable schedulers and the
- cli &amp; gui clients.<br />(Sreekanth Ramakrishnan via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4176">HADOOP-4176</a>. Implement getFileChecksum(Path) in HftpFileSystem.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-249">HADOOP-249</a>. Reuse JVMs across Map-Reduce Tasks.
- Configuration changes to hadoop-default.xml:
- add mapred.job.reuse.jvm.num.tasks<br />(Devaraj Das via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4070">HADOOP-4070</a>. Provide a mechanism in Hive for registering UDFs from the
- query language.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2536">HADOOP-2536</a>. Implement a JDBC based database input and output formats to
- allow Map-Reduce applications to work with databases.<br />(Fredrik Hedberg and
- Enis Soztutar via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3019">HADOOP-3019</a>. A new library to support total order partitions.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3924">HADOOP-3924</a>. Added a 'KILLED' job status.<br />(Subramaniam Krishnan via
- acmurthy)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.19.0_-_2008-11-18_._improvements_')"> IMPROVEMENTS
- </a> (78)
- <ol id="release_0.19.0_-_2008-11-18_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4205">HADOOP-4205</a>. hive: metastore and ql to use the refactored SerDe library.<br />(zshao)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4106">HADOOP-4106</a>. libhdfs: add time, permission and user attribute support
- (part 2).<br />(Pete Wyckoff through zshao)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4104">HADOOP-4104</a>. libhdfs: add time, permission and user attribute support.<br />(Pete Wyckoff through zshao)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3908">HADOOP-3908</a>. libhdfs: better error message if libhdfs.so doesn't exist.<br />(Pete Wyckoff through zshao)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3732">HADOOP-3732</a>. Delay initialization of datanode block verification till
- the verification thread is started.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1627">HADOOP-1627</a>. Various small improvements to 'dfsadmin -report' output.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3577">HADOOP-3577</a>. Tools to inject blocks into name node and simulated
- data nodes for testing.<br />(Sanjay Radia via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2664">HADOOP-2664</a>. Add a lzop compatible codec, so that files compressed by lzop
- may be processed by map/reduce.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3655">HADOOP-3655</a>. Add additional ant properties to control junit.<br />(Steve
- Loughran via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3543">HADOOP-3543</a>. Update the copyright year to 2008.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3587">HADOOP-3587</a>. Add a unit test for the contrib/data_join framework.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3402">HADOOP-3402</a>. Add terasort example program<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3660">HADOOP-3660</a>. Add replication factor for injecting blocks in simulated
- datanodes.<br />(Sanjay Radia via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3684">HADOOP-3684</a>. Add a cloning function to the contrib/data_join framework
- permitting users to define a more efficient method for cloning values from
- the reduce than serialization/deserialization.<br />(Runping Qi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3478">HADOOP-3478</a>. Improves the handling of map output fetching. Now the
- randomization is by the hosts (and not the map outputs themselves).<br />(Jothi Padmanabhan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3617">HADOOP-3617</a>. Removed redundant checks of accounting space in MapTask and
- makes the spill thread persistent so as to avoid creating a new one for
- each spill.<br />(Chris Douglas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3412">HADOOP-3412</a>. Factor the scheduler out of the JobTracker and make
- it pluggable.<br />(Tom White and Brice Arnould via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3756">HADOOP-3756</a>. Minor. Remove unused dfs.client.buffer.dir from
- hadoop-default.xml.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3747">HADOOP-3747</a>. Adds counter support for MultipleOutputs.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3169">HADOOP-3169</a>. LeaseChecker daemon should not be started in DFSClient
- constructor. (TszWo (Nicholas), SZE via hairong)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3824">HADOOP-3824</a>. Move base functionality of StatusHttpServer to a core
- package. (TszWo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3646">HADOOP-3646</a>. Add a bzip2 compatible codec, so bzip compressed data
- may be processed by map/reduce.<br />(Abdul Qadeer via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3861">HADOOP-3861</a>. MapFile.Reader and Writer should implement Closeable.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3791">HADOOP-3791</a>. Introduce generics into ReflectionUtils.<br />(Chris Smith via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3694">HADOOP-3694</a>. Improve unit test performance by changing
- MiniDFSCluster to listen only on 127.0.0.1.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3620">HADOOP-3620</a>. Namenode should synchronously resolve a datanode's network
- location when the datanode registers.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3860">HADOOP-3860</a>. NNThroughputBenchmark is extended with rename and delete
- benchmarks.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3892">HADOOP-3892</a>. Include unix group name in JobConf.<br />(Matei Zaharia via johan)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3875">HADOOP-3875</a>. Change the time period between heartbeats to be relative to
- the end of the heartbeat rpc, rather than the start. This causes better
- behavior if the JobTracker is overloaded.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3853">HADOOP-3853</a>. Move multiple input format (<a href="http://issues.apache.org/jira/browse/HADOOP-372">HADOOP-372</a>) extension to
- library package.<br />(tomwhite via johan)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-9">HADOOP-9</a>. Use roulette scheduling for temporary space when the size
- is not known.<br />(Ari Rabkin via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3202">HADOOP-3202</a>. Use recursive delete rather than FileUtil.fullyDelete.<br />(Amareshwari Sriramadasu via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3368">HADOOP-3368</a>. Remove common-logging.properties from conf.<br />(Steve Loughran
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3851">HADOOP-3851</a>. Fix spelling mistake in FSNamesystemMetrics.<br />(Steve Loughran
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3780">HADOOP-3780</a>. Remove asynchronous resolution of network topology in the
- JobTracker<br />(Amar Kamat via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3852">HADOOP-3852</a>. Add ShellCommandExecutor.toString method to make nicer
- error messages.<br />(Steve Loughran via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3844">HADOOP-3844</a>. Include message of local exception in RPC client failures.<br />(Steve Loughran via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3935">HADOOP-3935</a>. Split out inner classes from DataNode.java.<br />(johan)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3905">HADOOP-3905</a>. Create generic interfaces for edit log streams.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3062">HADOOP-3062</a>. Add metrics to DataNode and TaskTracker to record network
- traffic for HDFS reads/writes and MR shuffling.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3742">HADOOP-3742</a>. Remove HDFS from public java doc and add javadoc-dev for
- generative javadoc for developers.<br />(Sanjay Radia via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3944">HADOOP-3944</a>. Improve documentation for public TupleWritable class in
- join package.<br />(Chris Douglas via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2330">HADOOP-2330</a>. Preallocate HDFS transaction log to improve performance.<br />(dhruba and hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3965">HADOOP-3965</a>. Convert DataBlockScanner into a package private class.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3488">HADOOP-3488</a>. Prevent hadoop-daemon from rsync'ing log files<br />(Stefan
- Groshupf and Craig Macdonald via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3342">HADOOP-3342</a>. Change the kill task actions to require http post instead of
- get to prevent accidental crawls from triggering it.<br />(enis via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3937">HADOOP-3937</a>. Limit the job name in the job history filename to 50
- characters.<br />(Matei Zaharia via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3943">HADOOP-3943</a>. Remove unnecessary synchronization in
- NetworkTopology.pseudoSortByDistance.<br />(hairong via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3498">HADOOP-3498</a>. File globbing alternation should be able to span path
- components.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3361">HADOOP-3361</a>. Implement renames for NativeS3FileSystem.<br />(Albert Chern via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3605">HADOOP-3605</a>. Make EC2 scripts show an error message if AWS_ACCOUNT_ID is
- unset.<br />(Al Hoang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4147">HADOOP-4147</a>. Remove unused class JobWithTaskContext from class
- JobInProgress.<br />(Amareshwari Sriramadasu via johan)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4151">HADOOP-4151</a>. Add a byte-comparable interface that both Text and
- BytesWritable implement.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4174">HADOOP-4174</a>. Move fs image/edit log methods from ClientProtocol to
- NamenodeProtocol.<br />(shv via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4181">HADOOP-4181</a>. Include a .gitignore and saveVersion.sh change to support
- developing under git.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4186">HADOOP-4186</a>. Factor LineReader out of LineRecordReader.<br />(tomwhite via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4184">HADOOP-4184</a>. Break the module dependencies between core, hdfs, and
- mapred.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4075">HADOOP-4075</a>. test-patch.sh now spits out ant commands that it runs.<br />(Ramya R via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4117">HADOOP-4117</a>. Improve configurability of Hadoop EC2 instances.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2411">HADOOP-2411</a>. Add support for larger CPU EC2 instance types.<br />(Chris K Wensel via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4083">HADOOP-4083</a>. Changed the configuration attribute queue.name to
- mapred.job.queue.name.<br />(Hemanth Yamijala via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4194">HADOOP-4194</a>. Added the JobConf and JobID to job-related methods in
- JobTrackerInstrumentation for better metrics.<br />(Mac Yang via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3975">HADOOP-3975</a>. Change test-patch script to report the working dir
- modifications preventing the suite from being run.<br />(Ramya R via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4124">HADOOP-4124</a>. Added a command-line switch to allow users to set job
- priorities, also allow it to be manipulated via the web-ui.<br />(Hemanth
- Yamijala via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2165">HADOOP-2165</a>. Augmented JobHistory to include the URIs to the tasks'
- userlogs.<br />(Vinod Kumar Vavilapalli via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4062">HADOOP-4062</a>. Remove the synchronization on the output stream when a
- connection is closed and also remove an undesirable exception when
- a client is stopped while there is no pending RPC request.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4227">HADOOP-4227</a>. Remove the deprecated class org.apache.hadoop.fs.ShellCommand.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4006">HADOOP-4006</a>. Clean up FSConstants and move some of the constants to
- better places.<br />(Sanjay Radia via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4279">HADOOP-4279</a>. Trace the seeds of random sequences in append unit tests to
- make intermittent failures reproducible.<br />(szetszwo via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4209">HADOOP-4209</a>. Remove the change to the format of task attempt id by
- incrementing the task attempt numbers by 1000 when the job restarts.<br />(Amar Kamat via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4301">HADOOP-4301</a>. Adds forrest doc for the skip bad records feature.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4354">HADOOP-4354</a>. Separate TestDatanodeDeath.testDatanodeDeath() into 4 tests.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3790">HADOOP-3790</a>. Add more unit tests for testing HDFS file append.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4321">HADOOP-4321</a>. Include documentation for the capacity scheduler.<br />(Hemanth
- Yamijala via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4424">HADOOP-4424</a>. Change menu layout for Hadoop documentation (Boris Shkolnik
- via cdouglas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4438">HADOOP-4438</a>. Update forrest documentation to include missing FsShell
- commands.<br />(Suresh Srinivas via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4105">HADOOP-4105</a>. Add forrest documentation for libhdfs.<br />(Pete Wyckoff via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4510">HADOOP-4510</a>. Make getTaskOutputPath public.<br />(Chris Wensel via omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.19.0_-_2008-11-18_._optimizations_')"> OPTIMIZATIONS
- </a> (11)
- <ol id="release_0.19.0_-_2008-11-18_._optimizations_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3556">HADOOP-3556</a>. Removed lock contention in MD5Hash by replacing the
- singleton MessageDigester with an instance per Thread using
- ThreadLocal.<br />(Iv&aacute;n de Prado via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3328">HADOOP-3328</a>. When client is writing data to DFS, only the last
- datanode in the pipeline needs to verify the checksum. Saves around
- 30% CPU on intermediate datanodes.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3863">HADOOP-3863</a>. Use a thread-local string encoder rather than a static one
- that is protected by a lock.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3864">HADOOP-3864</a>. Prevent the JobTracker from locking up when a job is being
- initialized.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3816">HADOOP-3816</a>. Faster directory listing in KFS.<br />(Sriram Rao via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2130">HADOOP-2130</a>. Pipes submit job should have both blocking and non-blocking
- versions.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3769">HADOOP-3769</a>. Make the SampleMapper and SampleReducer from
- GenericMRLoadGenerator public, so they can be used in other contexts.<br />(Lingyun Yang via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3514">HADOOP-3514</a>. Inline the CRCs in intermediate files as opposed to reading
- it from a different .crc file.<br />(Jothi Padmanabhan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3638">HADOOP-3638</a>. Caches the iFile index files in memory to reduce seeks<br />(Jothi Padmanabhan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4225">HADOOP-4225</a>. FSEditLog.logOpenFile() should persist accessTime
- rather than modificationTime.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4380">HADOOP-4380</a>. Made several new classes (Child, JVMId,
- JobTrackerInstrumentation, QueueManager, ResourceEstimator,
- TaskTrackerInstrumentation, and TaskTrackerMetricsInst) in
- org.apache.hadoop.mapred package private instead of public.<br />(omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.19.0_-_2008-11-18_._bug_fixes_')"> BUG FIXES
- </a> (152)
- <ol id="release_0.19.0_-_2008-11-18_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3563">HADOOP-3563</a>. Refactor the distributed upgrade code so that it is
- easier to identify datanode and namenode related code.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3640">HADOOP-3640</a>. Fix the read method in the NativeS3InputStream.<br />(tomwhite via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3711">HADOOP-3711</a>. Fixes the Streaming input parsing to properly find the
- separator.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3725">HADOOP-3725</a>. Prevent TestMiniMRMapDebugScript from swallowing exceptions.<br />(Steve Loughran via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3726">HADOOP-3726</a>. Throw exceptions from TestCLI setup and teardown instead of
- swallowing them.<br />(Steve Loughran via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3721">HADOOP-3721</a>. Refactor CompositeRecordReader and related mapred.join classes
- to make them clearer.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3720">HADOOP-3720</a>. Re-read the config file when dfsadmin -refreshNodes is invoked
- so dfs.hosts and dfs.hosts.exclude are observed.<br />(lohit vijayarenu via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3485">HADOOP-3485</a>. Allow writing to files over fuse.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3723">HADOOP-3723</a>. The flags to the libhdfs.create call can be treated as
- a bitmask.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3643">HADOOP-3643</a>. Filter out completed tasks when asking for running tasks in
- the JobTracker web/ui.<br />(Amar Kamat via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3777">HADOOP-3777</a>. Ensure that Lzo compressors/decompressors correctly handle the
- case where native libraries aren't available.<br />(Chris Douglas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3728">HADOOP-3728</a>. Fix SleepJob so that it doesn't depend on temporary files,
- this ensures we can now run more than one instance of SleepJob
- simultaneously.<br />(Chris Douglas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3795">HADOOP-3795</a>. Fix saving image files on Namenode with different checkpoint
- stamps.<br />(Lohit Vijayarenu via mahadev)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3624">HADOOP-3624</a>. Improving createeditslog to create tree directory structure.<br />(Lohit Vijayarenu via mahadev)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3778">HADOOP-3778</a>. DFSInputStream.seek() did not retry in case of some errors.<br />(LN via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3661">HADOOP-3661</a>. The handling of moving files deleted through fuse-dfs to
- Trash is made similar to the behaviour from dfs shell.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3819">HADOOP-3819</a>. Unset LANG and LC_CTYPE in saveVersion.sh to make it
- compatible with non-English locales.<br />(Rong-En Fan via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3848">HADOOP-3848</a>. Cache calls to getSystemDir in the TaskTracker instead of
- calling it for each task start.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3131">HADOOP-3131</a>. Fix reduce progress reporting for compressed intermediate
- data.<br />(Matei Zaharia via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3796">HADOOP-3796</a>. fuse-dfs configuration is implemented as file system
- mount options.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3836">HADOOP-3836</a>. Fix TestMultipleOutputs to correctly clean up.<br />(Alejandro
- Abdelnur via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3805">HADOOP-3805</a>. Improve fuse-dfs write performance.<br />(Pete Wyckoff via zshao)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3846">HADOOP-3846</a>. Fix unit test CreateEditsLog to generate paths correctly.<br />(Lohit Vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3904">HADOOP-3904</a>. Fix unit tests using the old dfs package name.
- (Tsz Wo (Nicholas), SZE via johan)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3319">HADOOP-3319</a>. Fix some HOD error messages to go to stderr instead of
- stdout.<br />(Vinod Kumar Vavilapalli via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3907">HADOOP-3907</a>. Move INodeDirectoryWithQuota to its own .java file.
- (Tsz Wo (Nicholas), SZE via hairong)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3919">HADOOP-3919</a>. Fix attribute name in hadoop-default for
- mapred.jobtracker.instrumentation.<br />(Ari Rabkin via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3903">HADOOP-3903</a>. Change the package name for the servlets to be hdfs instead of
- dfs. (Tsz Wo (Nicholas) Sze via omalley)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3773">HADOOP-3773</a>. Change Pipes to set the default map output key and value
- types correctly.<br />(Koji Noguchi via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3952">HADOOP-3952</a>. Fix compilation error in TestDataJoin referencing dfs package.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3951">HADOOP-3951</a>. Fix package name for FSNamesystem logs and modify other
- hard-coded Logs to use the class name.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3889">HADOOP-3889</a>. Improve error reporting from HftpFileSystem, handling in
- DistCp. (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3946">HADOOP-3946</a>. Fix TestMapRed after hadoop-3664.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3949">HADOOP-3949</a>. Remove duplicate jars from Chukwa.<br />(Jerome Boulon via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3933">HADOOP-3933</a>. DataNode sometimes sends up to io.byte.per.checksum bytes
- more than required to client.<br />(Ning Li via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3962">HADOOP-3962</a>. Shell command "fs -count" should support paths with different
- file systems. (Tsz Wo (Nicholas), SZE via mahadev)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3957">HADOOP-3957</a>. Fix javac warnings in DistCp and TestCopyFiles. (Tsz Wo
- (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3958">HADOOP-3958</a>. Fix TestMapRed to check the success of test-job.<br />(omalley via
- acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3985">HADOOP-3985</a>. Fix TestHDFSServerPorts to use random ports.<br />(Hairong Kuang
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3964">HADOOP-3964</a>. Fix javadoc warnings introduced by FailMon.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3785">HADOOP-3785</a>. Fix FileSystem cache to be case-insensitive for scheme and
- authority.<br />(Bill de hOra via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3506">HADOOP-3506</a>. Fix a rare NPE caused by error handling in S3.<br />(Tom White via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3705">HADOOP-3705</a>. Fix mapred.join parser to accept InputFormats named with
- underscore and static, inner classes.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4023">HADOOP-4023</a>. Fix javadoc warnings introduced when the HDFS javadoc was
- made private.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4030">HADOOP-4030</a>. Remove lzop from the default list of codecs.<br />(Arun Murthy via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3961">HADOOP-3961</a>. Fix task disk space requirement estimates for virtual
- input jobs. Delays limiting task placement until after 10% of the maps
- have finished.<br />(Ari Rabkin via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2168">HADOOP-2168</a>. Fix problem with C++ record reader's progress not being
- reported to framework.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3966">HADOOP-3966</a>. Copy findbugs generated output files to PATCH_DIR while
- running test-patch.<br />(Ramya R via lohit)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4037">HADOOP-4037</a>. Fix the eclipse plugin for versions of kfs and log4j.<br />(nigel
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3950">HADOOP-3950</a>. Cause the Mini MR cluster to wait for task trackers to
- register before continuing.<br />(enis via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3910">HADOOP-3910</a>. Remove unused ClusterTestDFSNamespaceLogging and
- ClusterTestDFS. (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3954">HADOOP-3954</a>. Disable record skipping by default.<br />(Sharad Agarwal via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4050">HADOOP-4050</a>. Fix TestFairScheduler to use absolute paths for the work
- directory.<br />(Matei Zaharia via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4069">HADOOP-4069</a>. Keep temporary test files from TestKosmosFileSystem under
- test.build.data instead of /tmp.<br />(lohit via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4078">HADOOP-4078</a>. Create test files for TestKosmosFileSystem in separate
- directory under test.build.data.<br />(lohit)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3968">HADOOP-3968</a>. Fix getFileBlockLocations calls to use FileStatus instead
- of Path reflecting the new API.<br />(Pete Wyckoff via lohit)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3963">HADOOP-3963</a>. libhdfs does not exit on its own, instead it returns error
- to the caller and behaves as a true library.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4100">HADOOP-4100</a>. Removes the cleanupTask scheduling from the Scheduler
- implementations and moves it to the JobTracker.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4097">HADOOP-4097</a>. Make hive work well with speculative execution turned on.<br />(Joydeep Sen Sarma via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4113">HADOOP-4113</a>. Changes to libhdfs to not exit on its own, rather return
- an error code to the caller.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4054">HADOOP-4054</a>. Remove duplicate lease removal during edit log loading.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4071">HADOOP-4071</a>. FSNameSystem.isReplicationInProgress should add an
- underReplicated block to the neededReplication queue using method
- "add" not "update".<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4154">HADOOP-4154</a>. Fix type warnings in WritableUtils.<br />(szetszwo via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4133">HADOOP-4133</a>. Log files generated by Hive should reside in the
- build directory.<br />(Prasad Chakka via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4094">HADOOP-4094</a>. Hive now has hive-default.xml and hive-site.xml similar
- to core hadoop.<br />(Prasad Chakka via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4112">HADOOP-4112</a>. Handles cleanupTask in JobHistory<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3831">HADOOP-3831</a>. Very slow reading clients sometimes failed while reading.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4155">HADOOP-4155</a>. Use JobTracker's start time while initializing JobHistory's
- JobTracker Unique String.<br />(lohit)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4099">HADOOP-4099</a>. Fix null pointer when using HFTP from an 0.18 server.<br />(dhruba via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3570">HADOOP-3570</a>. Includes user specified libjar files in the client side
- classpath.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4129">HADOOP-4129</a>. Changed memory limits of TaskTracker and Tasks to be in
- KiloBytes rather than bytes.<br />(Vinod Kumar Vavilapalli via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4139">HADOOP-4139</a>. Optimize Hive multi group-by.<br />(Namin Jain via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3911">HADOOP-3911</a>. Add a check to fsck options to make sure -files is not
- the first option to resolve conflicts with GenericOptionsParser<br />(lohit)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3623">HADOOP-3623</a>. Refactor LeaseManager.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4125">HADOOP-4125</a>. Handles Reduce cleanup tip on the web ui.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4087">HADOOP-4087</a>. Hive Metastore API for php and python clients.<br />(Prasad Chakka via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4197">HADOOP-4197</a>. Update DATA_TRANSFER_VERSION for <a href="http://issues.apache.org/jira/browse/HADOOP-3981">HADOOP-3981</a>.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4138">HADOOP-4138</a>. Refactor the Hive SerDe library to better structure
- the interfaces to the serializer and de-serializer.<br />(Zheng Shao via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4195">HADOOP-4195</a>. Close compressor before returning to codec pool.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2403">HADOOP-2403</a>. Escapes some special characters before logging to
- history files.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4200">HADOOP-4200</a>. Fix a bug in the test-patch.sh script.<br />(Ramya R via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4084">HADOOP-4084</a>. Add explain plan capabilities to Hive Query Language.<br />(Ashish Thusoo via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4121">HADOOP-4121</a>. Preserve cause for exception if the initialization of
- HistoryViewer for JobHistory fails.<br />(Amareshwari Sri Ramadasu via
- acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4213">HADOOP-4213</a>. Fixes NPE in TestLimitTasksPerJobTaskScheduler.<br />(Sreekanth Ramakrishnan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4077">HADOOP-4077</a>. Setting access and modification time for a file
- requires write permissions on the file.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3592">HADOOP-3592</a>. Fix a couple of possible file leaks in FileUtil<br />(Bill de hOra via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4120">HADOOP-4120</a>. Hive interactive shell records the time taken by a
- query.<br />(Raghotham Murthy via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4090">HADOOP-4090</a>. The hive scripts pick up hadoop from HADOOP_HOME
- and then the path.<br />(Raghotham Murthy via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4242">HADOOP-4242</a>. Remove extra ";" in FSDirectory that blocks compilation
- in some IDEs.<br />(szetszwo via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4249">HADOOP-4249</a>. Fix eclipse path to include the hsqldb.jar.<br />(szetszwo via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4247">HADOOP-4247</a>. Move InputSampler into org.apache.hadoop.mapred.lib, so that
- examples.jar doesn't depend on tools.jar.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4269">HADOOP-4269</a>. Fix the deprecation of LineReader by extending the new class
- into the old name and deprecating it. Also update the tests to test the
- new class.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4280">HADOOP-4280</a>. Fix conversions between seconds in C and milliseconds in
- Java for access times for files.<br />(Pete Wyckoff via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4254">HADOOP-4254</a>. -setSpaceQuota command does not convert "TB" extension to
- terabytes properly. Implementation now uses StringUtils for parsing this.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4259">HADOOP-4259</a>. Findbugs should run over tools.jar also.<br />(cdouglas via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4275">HADOOP-4275</a>. Move public method isJobValidName from JobID to a private
- method in JobTracker.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4173">HADOOP-4173</a>. fix failures in TestProcfsBasedProcessTree and
- TestTaskTrackerMemoryManager tests. ProcfsBasedProcessTree and
- memory management in TaskTracker are disabled on Windows.<br />(Vinod K V via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4189">HADOOP-4189</a>. Fixes the history blocksize &amp; intertracker protocol version
- issues introduced as part of <a href="http://issues.apache.org/jira/browse/HADOOP-3245">HADOOP-3245</a>.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4190">HADOOP-4190</a>. Fixes the backward compatibility issue with Job History
- introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-3245">HADOOP-3245</a> and <a href="http://issues.apache.org/jira/browse/HADOOP-2403">HADOOP-2403</a>.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4237">HADOOP-4237</a>. Fixes the TestStreamingBadRecords.testNarrowDown testcase.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4274">HADOOP-4274</a>. Capacity scheduler accidentally modifies the underlying
- data structures when browsing the job lists.<br />(Hemanth Yamijala via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4309">HADOOP-4309</a>. Fix eclipse-plugin compilation.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4232">HADOOP-4232</a>. Fix race condition in JVM reuse when multiple slots become
- free.<br />(ddas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4302">HADOOP-4302</a>. Fix a race condition in TestReduceFetch that can yield false
- negatives.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3942">HADOOP-3942</a>. Update distcp documentation to include features introduced in
- <a href="http://issues.apache.org/jira/browse/HADOOP-3873">HADOOP-3873</a>, <a href="http://issues.apache.org/jira/browse/HADOOP-3939">HADOOP-3939</a>. (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4319">HADOOP-4319</a>. fuse-dfs dfs_read function returns as many bytes as it is
- told to read unless end-of-file is reached.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4246">HADOOP-4246</a>. Ensure we have the correct lower bound on the number of
- retries for fetching map-outputs; also fixed the case where the reducer
- automatically kills on too many unique map-outputs could not be fetched
- for small jobs.<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4163">HADOOP-4163</a>. Report FSErrors from map output fetch threads instead of
- merely logging them.<br />(Sharad Agarwal via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4261">HADOOP-4261</a>. Adds a setup task for jobs. This is required so that we
- don't setup jobs that haven't been inited yet (since init could lead
- to job failure). Only after the init has successfully happened do we
- launch the setupJob task.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4256">HADOOP-4256</a>. Removes Completed and Failed Job tables from
- jobqueue_details.jsp.<br />(Sreekanth Ramakrishnan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4267">HADOOP-4267</a>. Occasional exceptions while shutting down HSQLDB are logged
- but not rethrown.<br />(enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4018">HADOOP-4018</a>. The number of tasks for a single job cannot exceed a
- pre-configured maximum value.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4288">HADOOP-4288</a>. Fixes a NPE problem in CapacityScheduler.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4014">HADOOP-4014</a>. Create hard links with 'fsutil hardlink' on Windows.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4393">HADOOP-4393</a>. Merged org.apache.hadoop.fs.permission.AccessControlException
- and org.apache.hadoop.security.AccessControlIOException into a single
- class hadoop.security.AccessControlException.<br />(omalley via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4287">HADOOP-4287</a>. Fixes an issue to do with maintaining counts of running/pending
- maps/reduces.<br />(Sreekanth Ramakrishnan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4361">HADOOP-4361</a>. Makes sure that jobs killed from command line are killed
- fast (i.e., there is a slot to run the cleanup task soon).<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4400">HADOOP-4400</a>. Add "hdfs://" to fs.default.name on quickstart.html.<br />(Jeff Hammerbacher via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4378">HADOOP-4378</a>. Fix TestJobQueueInformation to use SleepJob rather than
- WordCount via TestMiniMRWithDFS.<br />(Sreekanth Ramakrishnan via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4376">HADOOP-4376</a>. Fix formatting in hadoop-default.xml for
- hadoop.http.filter.initializers.<br />(Enis Soztutar via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4410">HADOOP-4410</a>. Adds an extra arg to the API FileUtil.makeShellPath to
- determine whether to canonicalize file paths or not.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4236">HADOOP-4236</a>. Ensure un-initialized jobs are killed correctly on
- user-demand.<br />(Sharad Agarwal via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4373">HADOOP-4373</a>. Fix calculation of Guaranteed Capacity for the
- capacity-scheduler.<br />(Hemanth Yamijala via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4053">HADOOP-4053</a>. Schedulers must be notified when jobs complete.<br />(Amar Kamat via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4335">HADOOP-4335</a>. Fix FsShell -ls for filesystems without owners/groups.<br />(David
- Phillips via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4426">HADOOP-4426</a>. TestCapacityScheduler broke due to the two commits <a href="http://issues.apache.org/jira/browse/HADOOP-4053">HADOOP-4053</a>
- and <a href="http://issues.apache.org/jira/browse/HADOOP-4373">HADOOP-4373</a>. This patch fixes that.<br />(Hemanth Yamijala via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4418">HADOOP-4418</a>. Updates documentation in forrest for Mapred, streaming and pipes.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3155">HADOOP-3155</a>. Ensure that there is only one thread fetching
- TaskCompletionEvents on TaskTracker re-init.<br />(Dhruba Borthakur via
- acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4425">HADOOP-4425</a>. Fix EditLogInputStream to overload the bulk read method.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4427">HADOOP-4427</a>. Adds the new queue/job commands to the manual.<br />(Sreekanth Ramakrishnan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4278">HADOOP-4278</a>. Increase debug logging for unit test TestDatanodeDeath.
- Fix the case when primary is dead.<br />(dhruba via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4423">HADOOP-4423</a>. Keep block length when the block recovery is triggered by
- append.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4449">HADOOP-4449</a>. Fix dfsadmin usage.<br />(Raghu Angadi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4455">HADOOP-4455</a>. Added TestSerDe so that unit tests can run successfully.<br />(Ashish Thusoo via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4457">HADOOP-4457</a>. Fixes an input split logging problem introduced by
- <a href="http://issues.apache.org/jira/browse/HADOOP-3245">HADOOP-3245</a>.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4464">HADOOP-4464</a>. Separate out TestFileCreationClient from TestFileCreation.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4404">HADOOP-4404</a>. saveFSImage() removes files from a storage directory that do
- not correspond to its type.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4149">HADOOP-4149</a>. Fix handling of updates to the job priority, by changing the
- list of jobs to be keyed by the priority, submit time, and job tracker id.<br />(Amar Kamat via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4296">HADOOP-4296</a>. Fix job client failures by not retiring a job as soon as it
- is finished.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4439">HADOOP-4439</a>. Remove configuration variables that aren't usable yet, in
- particular mapred.tasktracker.tasks.maxmemory and mapred.task.max.memory.<br />(Hemanth Yamijala via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4230">HADOOP-4230</a>. Fix for serde2 interface, limit operator, select * operator,
- UDF trim functions and sampling.<br />(Ashish Thusoo via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4358">HADOOP-4358</a>. No need to truncate access time in INode. Also fixes NPE
- in CreateEditsLog.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4387">HADOOP-4387</a>. TestHDFSFileSystemContract fails on windows nightly builds.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4466">HADOOP-4466</a>. Ensure that SequenceFileOutputFormat isn't tied to Writables
- and can be used with other Serialization frameworks.<br />(Chris Wensel via
- acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4525">HADOOP-4525</a>. Fix ipc.server.ipcnodelay originally missed in <a href="http://issues.apache.org/jira/browse/HADOOP-2232">HADOOP-2232</a>.<br />(cdouglas via Clint Morgan)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4498">HADOOP-4498</a>. Ensure that JobHistory correctly escapes the job name so that
- regex patterns work.<br />(Chris Wensel via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4446">HADOOP-4446</a>. Modify guaranteed capacity labels in capacity scheduler's UI
- to reflect the information being displayed.<br />(Sreekanth Ramakrishnan via
- yhemanth)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4282">HADOOP-4282</a>. Some user facing URLs are not filtered by user filters.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4595">HADOOP-4595</a>. Fixes two race conditions - one to do with updating free slot count,
- and another to do with starting the MapEventsFetcher thread.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4552">HADOOP-4552</a>. Fix a deadlock in RPC server.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4471">HADOOP-4471</a>. Sort running jobs by priority in the capacity scheduler.<br />(Amar Kamat via yhemanth)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4500">HADOOP-4500</a>. Fix MultiFileSplit to get the FileSystem from the relevant
- path rather than the JobClient.<br />(Joydeep Sen Sarma via dhruba)</li>
- </ol>
- </li>
- </ul>
- <h2><a href="javascript:toggleList('older')">Older Releases</a></h2>
- <ul id="older">
- <h3><a href="javascript:toggleList('release_0.18.4_-_unreleased_')">Release 0.18.4 - Unreleased
- </a></h3>
- <ul id="release_0.18.4_-_unreleased_">
- <li><a href="javascript:toggleList('release_0.18.4_-_unreleased_._bug_fixes_')"> BUG FIXES
- </a> (3)
- <ol id="release_0.18.4_-_unreleased_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5114">HADOOP-5114</a>. Remove timeout for accept() in DataNode. This makes accept()
- fail in JDK on Windows and causes many tests to fail.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5192">HADOOP-5192</a>. Block receiver should not remove a block that's created or
- being written by other threads.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-5134">HADOOP-5134</a>. FSNamesystem#commitBlockSynchronization adds under-construction
- block locations to blocksMap.<br />(Dhruba Borthakur via hairong)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.18.3_-_2009-01-27_')">Release 0.18.3 - 2009-01-27
- </a></h3>
- <ul id="release_0.18.3_-_2009-01-27_">
- <li><a href="javascript:toggleList('release_0.18.3_-_2009-01-27_._improvements_')"> IMPROVEMENTS
- </a> (1)
- <ol id="release_0.18.3_-_2009-01-27_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4150">HADOOP-4150</a>. Include librecordio in hadoop releases.<br />(Giridharan Kesavan
- via acmurthy)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.3_-_2009-01-27_._bug_fixes_')"> BUG FIXES
- </a> (41)
- <ol id="release_0.18.3_-_2009-01-27_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4499">HADOOP-4499</a>. DFSClient should invoke checksumOk only once.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4597">HADOOP-4597</a>. Calculate mis-replicated blocks when safe-mode is turned
- off manually.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3121">HADOOP-3121</a>. lsr should keep listing the remaining items but not
- terminate if there is any IOException.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4610">HADOOP-4610</a>. Always calculate mis-replicated blocks when safe-mode is
- turned off.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3883">HADOOP-3883</a>. Limit namenode to assign at most one generation stamp for
- a particular block within a short period.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4556">HADOOP-4556</a>. Block went missing.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4643">HADOOP-4643</a>. NameNode should exclude excessive replicas when counting
- live replicas for a block.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4703">HADOOP-4703</a>. Should not wait for proxy forever in lease recovering.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4647">HADOOP-4647</a>. NamenodeFsck should close the DFSClient it has created.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4616">HADOOP-4616</a>. Fuse-dfs can handle bad values from FileSystem.read call.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4061">HADOOP-4061</a>. Throttle Datanode decommission monitoring in Namenode.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4659">HADOOP-4659</a>. Root cause of connection failure is being lost to code that
- uses it for delaying startup.<br />(Steve Loughran and Hairong via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4614">HADOOP-4614</a>. Lazily open segments when merging map spills to avoid using
- too many file descriptors.<br />(Yuri Pradkin via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4257">HADOOP-4257</a>. The DFS client should pick only one datanode as the candidate
- to initiate lease recovery. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4713">HADOOP-4713</a>. Fix librecordio to handle records larger than 64k.<br />(Christian
- Kunz via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4635">HADOOP-4635</a>. Fix a memory leak in fuse dfs.<br />(pete wyckoff via mahadev)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4714">HADOOP-4714</a>. Report status between merges and make the number of records
- between progress reports configurable.<br />(Jothi Padmanabhan via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4726">HADOOP-4726</a>. Fix documentation typos "the the".<br />(Edward J. Yoon via
- szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4679">HADOOP-4679</a>. Datanode prints tons of log messages: waiting for threadgroup
- to exit, active threads is XX.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4746">HADOOP-4746</a>. Job output directory should be normalized.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4717">HADOOP-4717</a>. Removal of default port# in NameNode.getUri() causes a
- map/reduce job to fail to promote temporary output.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4778">HADOOP-4778</a>. Check for zero size block meta file when updating a block.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4742">HADOOP-4742</a>. Replica gets deleted by mistake.<br />(Wang Xu via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4702">HADOOP-4702</a>. Failed block replication leaves an incomplete block in
- receiver's tmp data directory.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4613">HADOOP-4613</a>. Fix block browsing on Web UI.<br />(Johan Oskarsson via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4806">HADOOP-4806</a>. HDFS rename should not use src path as a regular expression.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4795">HADOOP-4795</a>. Prevent lease monitor getting into an infinite loop when
- leases and the namespace tree do not match.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4620">HADOOP-4620</a>. Fixes Streaming to handle well the cases of map/reduce with empty
- input/output.<br />(Ravi Gummadi via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4857">HADOOP-4857</a>. Fixes TestUlimit to have exactly 1 map in the jobs spawned.<br />(Ravi Gummadi via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4810">HADOOP-4810</a>. Data lost at cluster startup time.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4797">HADOOP-4797</a>. Improve how RPC server reads and writes large buffers. Avoids
- soft-leak of direct buffers and excess copies in NIO layer.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4840">HADOOP-4840</a>. TestNodeCount sometimes fails with NullPointerException.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4904">HADOOP-4904</a>. Fix deadlock while leaving safe mode.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1980">HADOOP-1980</a>. 'dfsadmin -safemode enter' should prevent the namenode from
- leaving safemode automatically.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4951">HADOOP-4951</a>. Lease monitor should acquire the LeaseManager lock but not the
- Monitor lock.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4935">HADOOP-4935</a>. processMisReplicatedBlocks() should not clear
- excessReplicateMap.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4961">HADOOP-4961</a>. Fix ConcurrentModificationException in lease recovery
- of empty files.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4971">HADOOP-4971</a>. A long (unexpected) delay at datanodes could make subsequent
- block reports from many datanodes at the same time.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4910">HADOOP-4910</a>. NameNode should exclude replicas when choosing excessive
- replicas to delete to avoid data loss.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4983">HADOOP-4983</a>. Fixes a problem in updating Counters in the status reporting.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4924">HADOOP-4924</a>. Fixes a race condition in TaskTracker re-init.<br />(ddas)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.18.2_-_2008-11-03_')">Release 0.18.2 - 2008-11-03
- </a></h3>
- <ul id="release_0.18.2_-_2008-11-03_">
- <li><a href="javascript:toggleList('release_0.18.2_-_2008-11-03_._bug_fixes_')"> BUG FIXES
- </a> (16)
- <ol id="release_0.18.2_-_2008-11-03_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3614">HADOOP-3614</a>. Fix a bug that Datanode may use an old GenerationStamp to get
- meta file.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4314">HADOOP-4314</a>. Simulated datanodes should not include blocks that are still
- being written in their block report.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4228">HADOOP-4228</a>. dfs datanode metrics, bytes_read and bytes_written, overflow
- due to incorrect type used.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4395">HADOOP-4395</a>. The FSEditLog loading is incorrect for the case OP_SET_OWNER.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4351">HADOOP-4351</a>. FSNamesystem.getBlockLocationsInternal throws
- ArrayIndexOutOfBoundsException.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4403">HADOOP-4403</a>. Make TestLeaseRecovery and TestFileCreation more robust.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4292">HADOOP-4292</a>. Do not support append() for LocalFileSystem.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4399">HADOOP-4399</a>. Make fuse-dfs multi-thread access safe.<br />(Pete Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4369">HADOOP-4369</a>. Use setMetric(...) instead of incrMetric(...) for metrics
- averages.<br />(Brian Bockelman via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4469">HADOOP-4469</a>. Rename and add the ant task jar file to the tar file.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3914">HADOOP-3914</a>. DFSClient sends Checksum Ok only once for a block.<br />(Christian Kunz via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4467">HADOOP-4467</a>. SerializationFactory now uses the current context ClassLoader
- allowing for user supplied Serialization instances.<br />(Chris Wensel via
- acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4517">HADOOP-4517</a>. Release FSDataset lock before joining ongoing create threads.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4526">HADOOP-4526</a>. fsck failing with NullPointerException.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4483">HADOOP-4483</a>. Honor the max parameter in DatanodeDescriptor.getBlockArray(..).<br />(Ahad Rana and Hairong Kuang via szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4340">HADOOP-4340</a>. Correctly set the exit code from JobShell.main so that the
- 'hadoop jar' command returns the right code to the user.<br />(acmurthy)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.2_-_2008-11-03_._new_features_')"> NEW FEATURES
- </a> (1)
- <ol id="release_0.18.2_-_2008-11-03_._new_features_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2421">HADOOP-2421</a>. Add jdiff output to documentation, listing all API
- changes from the prior release.<br />(cutting)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.18.1_-_2008-09-17_')">Release 0.18.1 - 2008-09-17
- </a></h3>
- <ul id="release_0.18.1_-_2008-09-17_">
- <li><a href="javascript:toggleList('release_0.18.1_-_2008-09-17_._improvements_')"> IMPROVEMENTS
- </a> (1)
- <ol id="release_0.18.1_-_2008-09-17_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3934">HADOOP-3934</a>. Upgrade log4j to 1.2.15.<br />(omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.1_-_2008-09-17_._bug_fixes_')"> BUG FIXES
- </a> (5)
- <ol id="release_0.18.1_-_2008-09-17_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3995">HADOOP-3995</a>. In case of quota failure on HDFS, rename does not restore
- source filename.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3821">HADOOP-3821</a>. Prevent SequenceFile and IFile from duplicating codecs in
- CodecPool when closed more than once.<br />(Arun Murthy via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4040">HADOOP-4040</a>. Remove coded default of the IPC idle connection timeout
- from the TaskTracker, which was causing HDFS client connections to not be
- collected.<br />(ddas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4046">HADOOP-4046</a>. Made WritableComparable's constructor protected instead of
- private to re-enable class derivation.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3940">HADOOP-3940</a>. Fix in-memory merge condition to wait when there are no map
- outputs or when the final map outputs are being fetched without contention.<br />(cdouglas)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.18.0_-_2008-08-19_')">Release 0.18.0 - 2008-08-19
- </a></h3>
- <ul id="release_0.18.0_-_2008-08-19_">
- <li><a href="javascript:toggleList('release_0.18.0_-_2008-08-19_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (23)
- <ol id="release_0.18.0_-_2008-08-19_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2703">HADOOP-2703</a>. The default options to fsck skips checking files
- that are being written to. The output of fsck is incompatible
- with previous release.<br />(lohit vijayarenu via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2865">HADOOP-2865</a>. FsShell.ls() printout format changed to print file names
- in the end of the line.<br />(Edward J. Yoon via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3283">HADOOP-3283</a>. The Datanode has a RPC server. It currently supports
- two RPCs: the first RPC retrieves the metadata about a block and the
- second RPC sets the generation stamp of an existing block.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2797">HADOOP-2797</a>. Code related to upgrading to 0.14 (Block CRCs) is
- removed. As a result, upgrade to 0.18 or later from 0.13 or earlier
- is not supported. If upgrading from 0.13 or earlier is required,
- please upgrade to an intermediate version (0.14-0.17) and then
- to this version.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-544">HADOOP-544</a>. This issue introduces new classes JobID, TaskID and
- TaskAttemptID, which should be used instead of their string counterparts.
- Functions in JobClient, TaskReport, RunningJob, jobcontrol.Job and
- TaskCompletionEvent that use string arguments are deprecated in favor
- of the corresponding ones that use ID objects. Applications can use
- xxxID.toString() and xxxID.forName() methods to convert/restore objects
- to/from strings.<br />(Enis Soztutar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2188">HADOOP-2188</a>. RPC client sends a ping rather than throw timeouts.
- RPC server does not throw away old RPCs. If clients and the server are on
- different versions, they are not able to function well. In addition,
- the property ipc.client.timeout is removed from the default hadoop
- configuration. It also removes metrics RpcOpsDiscardedOPsNum.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2181">HADOOP-2181</a>. This issue adds logging for input splits in Jobtracker log
- and jobHistory log. Also adds web UI for viewing input splits in job UI
- and history UI.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3226">HADOOP-3226</a>. Run combiners multiple times over map outputs as they
- are merged in both the map and the reduce tasks.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3329">HADOOP-3329</a>. DatanodeDescriptor objects should not be stored in the
- fsimage.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2656">HADOOP-2656</a>. The Block object has a generation stamp inside it.
- Existing blocks get a generation stamp of 0. This is needed to support
- appends.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3390">HADOOP-3390</a>. Removed deprecated ClientProtocol.abandonFileInProgress().
- (Tsz Wo (Nicholas), SZE via rangadi)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3405">HADOOP-3405</a>. Made some map/reduce internal classes non-public:
- MapTaskStatus, ReduceTaskStatus, JobSubmissionProtocol,
- CompletedJobStatusStore.<br />(enis via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3265">HADOOP-3265</a>. Removed deprecated API getFileCacheHints().<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3310">HADOOP-3310</a>. The namenode instructs the primary datanode to do lease
- recovery. The block gets a new generation stamp.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2909">HADOOP-2909</a>. Improve IPC idle connection management. Property
- ipc.client.maxidletime is removed from the default configuration,
- instead it is defined as twice of the ipc.client.connection.maxidletime.
- A connection with outstanding requests won't be treated as idle.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3459">HADOOP-3459</a>. Change in the output format of dfs -ls to more closely match
- /bin/ls. New format is: perm repl owner group size date name<br />(Mukund Madhugiri via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3113">HADOOP-3113</a>. An fsync invoked on a HDFS file really really
- persists data! The datanode moves blocks in the tmp directory to
- the real block directory on a datanode-restart.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3452">HADOOP-3452</a>. Change fsck to return non-zero status for a corrupt
- FileSystem.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3193">HADOOP-3193</a>. Include the address of the client that found the corrupted
- block in the log. Also include a CorruptedBlocks metric to track the size
- of the corrupted block map.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3512">HADOOP-3512</a>. Separate out the tools into a tools jar.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3598">HADOOP-3598</a>. Ensure that temporary task-output directories are not created
- if they are not necessary e.g. for Maps with no side-effect files.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3665">HADOOP-3665</a>. Modify WritableComparator so that it only creates instances
- of the keytype if the type does not define a WritableComparator. Calling
- the superclass compare will throw a NullPointerException. Also define
- a RawComparator for NullWritable and permit it to be written as a key
- to SequenceFiles.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3673">HADOOP-3673</a>. Avoid deadlock caused by DataNode RPC recoverBlock().
- (Tsz Wo (Nicholas), SZE via rangadi)
- </li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.0_-_2008-08-19_._new_features_')"> NEW FEATURES
- </a> (25)
- <ol id="release_0.18.0_-_2008-08-19_._new_features_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3074">HADOOP-3074</a>. Provides a UrlStreamHandler for DFS and other FS,
- relying on FileSystem<br />(taton)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2585">HADOOP-2585</a>. Name-node imports namespace data from a recent checkpoint
- accessible via a NFS mount.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3061">HADOOP-3061</a>. Writable types for doubles and bytes.<br />(Andrzej
- Bialecki via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2857">HADOOP-2857</a>. Allow libhdfs to set jvm options.<br />(Craig Macdonald
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3317">HADOOP-3317</a>. Add default port for HDFS namenode. The port in
- "hdfs:" URIs now defaults to 8020, so that one may simply use URIs
- of the form "hdfs://example.com/dir/file".<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2019">HADOOP-2019</a>. Adds support for .tar, .tgz and .tar.gz files in
- DistributedCache<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3058">HADOOP-3058</a>. Add FSNamesystem status metrics.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1915">HADOOP-1915</a>. Allow users to specify counters via strings instead
- of enumerations.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2065">HADOOP-2065</a>. Delay invalidating corrupt replicas of block until it
- is removed from under replicated state. If all replicas are found to
- be corrupt, retain all copies and mark the block as corrupt.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3221">HADOOP-3221</a>. Adds org.apache.hadoop.mapred.lib.NLineInputFormat, which
- splits files into splits each of N lines. N can be specified by
- configuration property "mapred.line.input.format.linespermap", which
- defaults to 1.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3336">HADOOP-3336</a>. Direct a subset of annotated FSNamesystem calls for audit
- logging.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3400">HADOOP-3400</a>. A new API FileSystem.deleteOnExit() that facilitates
- handling of temporary files in HDFS.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4">HADOOP-4</a>. Add fuse-dfs to contrib, permitting one to mount an
- HDFS filesystem on systems that support FUSE, e.g., Linux.<br />(Pete Wyckoff via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3246">HADOOP-3246</a>. Add FTPFileSystem.<br />(Ankur Goel via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3250">HADOOP-3250</a>. Extend FileSystem API to allow appending to files.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3177">HADOOP-3177</a>. Implement Syncable interface for FileSystem.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1328">HADOOP-1328</a>. Implement user counters in streaming.<br />(tomwhite via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3187">HADOOP-3187</a>. Quotas for namespace management.<br />(Hairong Kuang via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3307">HADOOP-3307</a>. Support for Archives in Hadoop.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3460">HADOOP-3460</a>. Add SequenceFileAsBinaryOutputFormat to permit direct
- writes of serialized data.<br />(Koji Noguchi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3230">HADOOP-3230</a>. Add ability to get counter values from command
- line.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-930">HADOOP-930</a>. Add support for native S3 files.<br />(tomwhite via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3502">HADOOP-3502</a>. Quota API needs documentation in Forrest.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3413">HADOOP-3413</a>. Allow SequenceFile.Reader to use serialization
- framework.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3541">HADOOP-3541</a>. Import of the namespace from a checkpoint documented
- in hadoop user guide.<br />(shv)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.0_-_2008-08-19_._improvements_')"> IMPROVEMENTS
- </a> (47)
- <ol id="release_0.18.0_-_2008-08-19_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3677">HADOOP-3677</a>. Simplify generation stamp upgrade by making it a
- local upgrade on datanodes. Deleted distributed upgrade.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2928">HADOOP-2928</a>. Remove deprecated FileSystem.getContentLength().<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3130">HADOOP-3130</a>. Make the connect timeout smaller for getFile.<br />(Amar Ramesh Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3160">HADOOP-3160</a>. Remove deprecated exists() from ClientProtocol and
- FSNamesystem<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2910">HADOOP-2910</a>. Throttle IPC Clients during bursts of requests or
- server slowdown. Clients retry connection for up to 15 minutes
- when socket connection times out.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3295">HADOOP-3295</a>. Allow TextOutputFormat to use configurable separators.
- (Zheng Shao via cdouglas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3308">HADOOP-3308</a>. Improve QuickSort by excluding values eq the pivot from the
- partition.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2461">HADOOP-2461</a>. Trim property names in configuration.
- (Tsz Wo (Nicholas), SZE via shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2799">HADOOP-2799</a>. Deprecate o.a.h.io.Closeable in favor of java.io.Closeable.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3345">HADOOP-3345</a>. Enhance the hudson-test-patch target to cleanup messages,
- fix minor defects, and add eclipse plugin and python unit tests.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3144">HADOOP-3144</a>. Improve robustness of LineRecordReader by defining a maximum
- line length (mapred.linerecordreader.maxlength), thereby avoiding reading
- too far into the following split.<br />(Zheng Shao via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3334">HADOOP-3334</a>. Move lease handling from FSNamesystem into a separate class.
- (Tsz Wo (Nicholas), SZE via rangadi)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3332">HADOOP-3332</a>. Reduces the amount of logging in Reducer's shuffle phase.<br />(Devaraj Das)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3355">HADOOP-3355</a>. Enhances Configuration class to accept hex numbers for getInt
- and getLong.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3350">HADOOP-3350</a>. Add an argument to distcp to permit the user to limit the
- number of maps.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3013">HADOOP-3013</a>. Add corrupt block reporting to fsck.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3377">HADOOP-3377</a>. Remove TaskRunner::replaceAll and replace with equivalent
- String::replace.<br />(Brice Arnould via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3398">HADOOP-3398</a>. Minor improvement to a utility function that participates
- in backoff calculation.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3381">HADOOP-3381</a>. Clear references when directories are deleted so that
- the effect of memory leaks is not multiplied.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2867">HADOOP-2867</a>. Adds the task's CWD to its LD_LIBRARY_PATH.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3232">HADOOP-3232</a>. DU class runs the 'du' command in a separate thread so
- that it does not block user. DataNode misses heartbeats in large
- nodes otherwise.<br />(Johan Oskarsson via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3035">HADOOP-3035</a>. During block transfers between datanodes, the receiving
- datanode, now can report corrupt replicas received from src node to
- the namenode.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3434">HADOOP-3434</a>. Retain the cause of the bind failure in Server::bind.<br />(Steve Loughran via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3429">HADOOP-3429</a>. Increases the size of the buffers used for the communication
- for Streaming jobs.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3486">HADOOP-3486</a>. Change default for initial block report to 0 seconds
- and document it.<br />(Sanjay Radia via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3448">HADOOP-3448</a>. Improve the text in the assertion making sure the
- layout versions are consistent in the data node.<br />(Steve Loughran
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2095">HADOOP-2095</a>. Improve the Map-Reduce shuffle/merge by cutting down
- buffer-copies; changed intermediate sort/merge to use the new IFile format
- rather than SequenceFiles and compression of map-outputs is now
- implemented by compressing the entire file rather than SequenceFile
- compression. Shuffle also has been changed to use a simple byte-buffer
- manager rather than the InMemoryFileSystem.
- Configuration changes to hadoop-default.xml:
- deprecated mapred.map.output.compression.type<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-236">HADOOP-236</a>. JobTracker now refuses connection from a task tracker with a
- different version number.<br />(Sharad Agarwal via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3427">HADOOP-3427</a>. Improves the shuffle scheduler. It now waits for notifications
- from shuffle threads when it has scheduled enough, before scheduling more.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2393">HADOOP-2393</a>. Moves the handling of dir deletions in the tasktracker to
- a separate thread.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3501">HADOOP-3501</a>. Deprecate InMemoryFileSystem.<br />(cutting via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3366">HADOOP-3366</a>. Stall the shuffle while in-memory merge is in progress.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2916">HADOOP-2916</a>. Refactor src structure, but leave package structure alone.<br />(Raghu Angadi via mukund)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3492">HADOOP-3492</a>. Add forrest documentation for user archives.<br />(Mahadev Konar via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3467">HADOOP-3467</a>. Improve documentation for FileSystem::deleteOnExit.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3379">HADOOP-3379</a>. Documents stream.non.zero.exit.status.is.failure for Streaming.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3096">HADOOP-3096</a>. Improves documentation about the Task Execution Environment in
- the Map-Reduce tutorial.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2984">HADOOP-2984</a>. Add forrest documentation for DistCp.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3406">HADOOP-3406</a>. Add forrest documentation for Profiling.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2762">HADOOP-2762</a>. Add forrest documentation for controls of memory limits on
- hadoop daemons and Map-Reduce tasks.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3535">HADOOP-3535</a>. Fix documentation and name of IOUtils.close to
- reflect that it should only be used in cleanup contexts.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3593">HADOOP-3593</a>. Updates the mapred tutorial.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3547">HADOOP-3547</a>. Documents the way in which native libraries can be distributed
- via the DistributedCache.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3606">HADOOP-3606</a>. Updates the Streaming doc.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3532">HADOOP-3532</a>. Add jdiff reports to the build scripts.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3100">HADOOP-3100</a>. Develop tests to test the DFS command line interface.<br />(mukund)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3688">HADOOP-3688</a>. Fix up HDFS docs.<br />(Robert Chansler via hairong)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.0_-_2008-08-19_._optimizations_')"> OPTIMIZATIONS
- </a> (10)
- <ol id="release_0.18.0_-_2008-08-19_._optimizations_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3274">HADOOP-3274</a>. The default constructor of BytesWritable creates empty
- byte array. (Tsz Wo (Nicholas), SZE via shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3272">HADOOP-3272</a>. Remove redundant copy of Block object in BlocksMap.<br />(Lohit Vijayarenu via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3164">HADOOP-3164</a>. Reduce DataNode CPU usage by using FileChannel.transferTo().
- On Linux DataNode takes 5 times less CPU while serving data. Results may
- vary on other platforms.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3248">HADOOP-3248</a>. Optimization of saveFSImage.<br />(Dhruba via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3297">HADOOP-3297</a>. Fetch more task completion events from the job
- tracker and task tracker.<br />(ddas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3364">HADOOP-3364</a>. Faster image and log edits loading.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3369">HADOOP-3369</a>. Fast block processing during name-node startup.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1702">HADOOP-1702</a>. Reduce buffer copies when data is written to DFS.
- DataNodes take 30% less CPU while writing data.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3095">HADOOP-3095</a>. Speed up split generation in the FileInputSplit,
- especially for non-HDFS file systems. Deprecates
- InputFormat.validateInput.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3552">HADOOP-3552</a>. Add forrest documentation for Hadoop commands.<br />(Sharad Agarwal via cdouglas)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.18.0_-_2008-08-19_._bug_fixes_')"> BUG FIXES
- </a> (144)
- <ol id="release_0.18.0_-_2008-08-19_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2905">HADOOP-2905</a>. 'fsck -move' triggers NPE in NameNode.<br />(Lohit Vijayarenu via rangadi)</li>
- <li>Increment ClientProtocol.versionID missed by <a href="http://issues.apache.org/jira/browse/HADOOP-2585">HADOOP-2585</a>.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3254">HADOOP-3254</a>. Restructure internal namenode methods that process
- heartbeats to use well-defined BlockCommand object(s) instead of
- using the base java Object. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3176">HADOOP-3176</a>. Change lease record when an open-for-write file
- gets renamed.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3269">HADOOP-3269</a>. Fix a case when namenode fails to restart
- while processing a lease record. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3282">HADOOP-3282</a>. Port issues in TestCheckpoint resolved.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3268">HADOOP-3268</a>. file:// URLs issue in TestUrlStreamHandler under Windows.<br />(taton)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3127">HADOOP-3127</a>. Deleting files in trash should really remove them.<br />(Brice Arnould via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3300">HADOOP-3300</a>. Fix locking of explicit locks in NetworkTopology.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3270">HADOOP-3270</a>. Constant DatanodeCommands are stored in static final
- immutable variables for better code clarity.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2793">HADOOP-2793</a>. Fix broken links for worst performing shuffle tasks in
- the job history page.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3313">HADOOP-3313</a>. Avoid unnecessary calls to System.currentTimeMillis
- in RPC::Invoker.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3318">HADOOP-3318</a>. Recognize "Darwin" as an alias for "Mac OS X" to
- support Soylatte.<br />(Sam Pullara via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3301">HADOOP-3301</a>. Fix misleading error message when S3 URI hostname
- contains an underscore.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3338">HADOOP-3338</a>. Fix Eclipse plugin to compile after <a href="http://issues.apache.org/jira/browse/HADOOP-544">HADOOP-544</a> was
- committed. Updated all references to use the new JobID representation.<br />(taton via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3337">HADOOP-3337</a>. Loading FSEditLog was broken by <a href="http://issues.apache.org/jira/browse/HADOOP-3283">HADOOP-3283</a> since it
- changed Writable serialization of DatanodeInfo. This patch handles it.
- (Tsz Wo (Nicholas), SZE via rangadi)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3101">HADOOP-3101</a>. Prevent JobClient from throwing an exception when printing
- usage.<br />(Edward J. Yoon via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3119">HADOOP-3119</a>. Update javadoc for Text::getBytes to better describe its
- behavior.<br />(Tim Nelson via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2294">HADOOP-2294</a>. Fix documentation in libhdfs to refer to the correct free
- function.<br />(Craig Macdonald via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3335">HADOOP-3335</a>. Prevent the libhdfs build from deleting the wrong
- files on make clean.<br />(cutting via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2930">HADOOP-2930</a>. Make {start,stop}-balancer.sh work even if hadoop-daemon.sh
- is not in the PATH.<br />(Spiros Papadimitriou via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3085">HADOOP-3085</a>. Catch Exception in metrics util classes to ensure that
- misconfigured metrics don't prevent others from updating.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3299">HADOOP-3299</a>. CompositeInputFormat should configure the sub-input
- formats.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3309">HADOOP-3309</a>. Lower io.sort.mb and fs.inmemory.size.mb for MiniMRDFSSort
- unit test so it passes on Windows.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3348">HADOOP-3348</a>. TestUrlStreamHandler should set URLStreamFactory after
- DataNodes are initialized.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3371">HADOOP-3371</a>. Ignore InstanceAlreadyExistsException from
- MBeanUtil::registerMBean.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3349">HADOOP-3349</a>. A file rename was incorrectly changing the name inside a
- lease record. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3365">HADOOP-3365</a>. Removes an unnecessary copy of the key from SegmentDescriptor
- to MergeQueue.<br />(Devaraj Das)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3388">HADOOP-3388</a>. Fix for TestDatanodeBlockScanner to handle blocks with
- generation stamps in them.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3203">HADOOP-3203</a>. Fixes TaskTracker::localizeJob to pass correct file sizes
- for the jarfile and the jobfile.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3391">HADOOP-3391</a>. Fix a findbugs warning introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-3248">HADOOP-3248</a><br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3393">HADOOP-3393</a>. Fix datanode shutdown to call DataBlockScanner::shutdown and
- close its log, even if the scanner thread is not running.<br />(lohit vijayarenu
- via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3399">HADOOP-3399</a>. A debug message was logged at info level.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3396">HADOOP-3396</a>. TestDatanodeBlockScanner occasionally fails.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3339">HADOOP-3339</a>. Some of the failures on 3rd datanode in DFS write pipeline
- are not detected properly. This could lead to hard failure of client's
- write operation.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3409">HADOOP-3409</a>. Namenode should save the root inode into fsimage.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3296">HADOOP-3296</a>. Fix task cache to work for more than two levels in the cache
- hierarchy. This also adds a new counter to track cache hits at levels
- greater than two.<br />(Amar Kamat via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3375">HADOOP-3375</a>. Lease paths were sometimes not removed from
- LeaseManager.sortedLeasesByPath. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3424">HADOOP-3424</a>. Values returned by getPartition should be checked to
- make sure they are in the range 0 to #reduces - 1<br />(cdouglas via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3408">HADOOP-3408</a>. Change FSNamesystem to send its metrics as integers to
- accommodate collectors that don't support long values.<br />(lohit vijayarenu
- via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3403">HADOOP-3403</a>. Fixes a problem in the JobTracker to do with handling of lost
- tasktrackers.<br />(Arun Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1318">HADOOP-1318</a>. Completed maps are not failed if the number of reducers is
- zero. (Amareshwari Sriramadasu via ddas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3351">HADOOP-3351</a>. Fixes the history viewer tool to not do huge StringBuffer
- allocations.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3419">HADOOP-3419</a>. Fixes TestFsck to wait for updates to happen before
- checking results to make the test more reliable.<br />(Lohit Vijaya
- Renu via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3259">HADOOP-3259</a>. Makes failure to read system properties due to a
- security manager non-fatal.<br />(Edward Yoon via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3451">HADOOP-3451</a>. Update libhdfs to use FileSystem::getFileBlockLocations
- instead of removed getFileCacheHints.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3401">HADOOP-3401</a>. Update FileBench to set the new
- "mapred.work.output.dir" property to work post-3041.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2669">HADOOP-2669</a>. DFSClient locks pendingCreates appropriately.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3410">HADOOP-3410</a>. Fix KFS implementation to return correct file
- modification time.<br />(Sriram Rao via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3340">HADOOP-3340</a>. Fix DFS metrics for BlocksReplicated, HeartbeatsNum, and
- BlockReportsAverageTime.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3435">HADOOP-3435</a>. Remove the assumption in the scripts that bash is at
- /bin/bash and fix the test patch to require bash instead of sh.<br />(Brice Arnould via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3471">HADOOP-3471</a>. Fix spurious errors from TestIndexedSort and add additional
- logging to let failures be reproducible.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3443">HADOOP-3443</a>. Avoid copying map output across partitions when renaming a
- single spill.<br />(omalley via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3454">HADOOP-3454</a>. Fix Text::find to search only valid byte ranges.<br />(Chad Whipkey
- via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3417">HADOOP-3417</a>. Removes the static configuration variable,
- commandLineConfig from JobClient. Moves the cli parsing from
- JobShell to GenericOptionsParser. Thus removes the class
- org.apache.hadoop.mapred.JobShell.<br />(Amareshwari Sriramadasu via
- ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2132">HADOOP-2132</a>. Only RUNNING/PREP jobs can be killed.<br />(Jothi Padmanabhan
- via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3476">HADOOP-3476</a>. Code cleanup in fuse-dfs.<br />(Peter Wyckoff via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2427">HADOOP-2427</a>. Ensure that the cwd of completed tasks is cleaned-up
- correctly on task-completion.<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2565">HADOOP-2565</a>. Remove DFSPath cache of FileStatus.
- (Tsz Wo (Nicholas), SZE via hairong)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3326">HADOOP-3326</a>. Cleanup the local-fs and in-memory merge in the ReduceTask by
- spawning only one thread each for the on-disk and in-memory merge.<br />(Sharad Agarwal via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3493">HADOOP-3493</a>. Fix TestStreamingFailure to use FileUtil.fullyDelete to
- ensure correct cleanup.<br />(Lohit Vijayarenu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3455">HADOOP-3455</a>. Fix NPE in ipc.Client in case of connection failure and
- improve its synchronization.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3240">HADOOP-3240</a>. Fix a testcase to not create files in the current directory.
- Instead the file is created in the test directory<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3496">HADOOP-3496</a>. Fix failure in TestHarFileSystem.testArchives due to change
- in <a href="http://issues.apache.org/jira/browse/HADOOP-3095">HADOOP-3095</a>.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3135">HADOOP-3135</a>. Get the system directory from the JobTracker instead of from
- the conf.<br />(Subramaniam Krishnan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3503">HADOOP-3503</a>. Fix a race condition when client and namenode start
- simultaneous recovery of the same block. (dhruba &amp; Tsz Wo
- (Nicholas), SZE)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3440">HADOOP-3440</a>. Fixes DistributedCache to not create symlinks for paths which
- don't have fragments even when createSymLink is true.<br />(Abhijit Bagri via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3463">HADOOP-3463</a>. Hadoop-daemons script should cd to $HADOOP_HOME.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3489">HADOOP-3489</a>. Fix NPE in SafeModeMonitor.<br />(Lohit Vijayarenu via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3509">HADOOP-3509</a>. Fix NPE in FSNamesystem.close. (Tsz Wo (Nicholas), SZE via
- shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3491">HADOOP-3491</a>. Name-node shutdown causes InterruptedException in
- ResolutionMonitor.<br />(Lohit Vijayarenu via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3511">HADOOP-3511</a>. Fixes namenode image to not set the root's quota to an
- invalid value when the quota was not saved in the image.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3516">HADOOP-3516</a>. Ensure the JobClient in HadoopArchives is initialized
- with a configuration.<br />(Subramaniam Krishnan via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3513">HADOOP-3513</a>. Improve NNThroughputBenchmark log messages.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3519">HADOOP-3519</a>. Fix NPE in DFS FileSystem rename.<br />(hairong via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3528">HADOOP-3528</a>. Metrics FilesCreated and files_deleted metrics
- do not match.<br />(Lohit via Mahadev)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3418">HADOOP-3418</a>. When a directory is deleted, any leases that point to files
- in the subdirectory are removed. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3542">HADOOP-3542</a>. Disables the creation of _logs directory for the archives
- directory.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3544">HADOOP-3544</a>. Fixes a documentation issue for hadoop archives.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3517">HADOOP-3517</a>. Fixes a problem in the reducer due to which the last InMemory
- merge may be missed.<br />(Arun Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3548">HADOOP-3548</a>. Fixes build.xml to copy all *.jar files to the dist.<br />(Owen O'Malley via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3363">HADOOP-3363</a>. Fix unformatted storage detection in FSImage.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3560">HADOOP-3560</a>. Fixes a problem to do with split creation in archives.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3545">HADOOP-3545</a>. Fixes an overflow problem in archives.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3561">HADOOP-3561</a>. Prevent the trash from deleting its parent directories.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3575">HADOOP-3575</a>. Fix the clover ant target after package refactoring.<br />(Nigel Daley via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3539">HADOOP-3539</a>. Fix the tool path in the bin/hadoop script under
- cygwin. (Tsz Wo (Nicholas), Sze via omalley)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3520">HADOOP-3520</a>. TestDFSUpgradeFromImage triggers a race condition in the
- Upgrade Manager. Fixed.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3586">HADOOP-3586</a>. Provide deprecated, backwards compatible semantics for the
- combiner to be run once and only once on each record.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3533">HADOOP-3533</a>. Add deprecated methods to provide API compatibility
- between 0.18 and 0.17. Remove the deprecated methods in trunk.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3580">HADOOP-3580</a>. Fixes a problem to do with specifying a har as an input to
- a job.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3333">HADOOP-3333</a>. Don't assign a task to a tasktracker that it failed to
- execute earlier (used to happen in the case of lost tasktrackers where
- the tasktracker would reinitialize and bind to a different port).<br />(Jothi Padmanabhan and Arun Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3534">HADOOP-3534</a>. Log IOExceptions that happen in closing the name
- system when the NameNode shuts down. (Tsz Wo (Nicholas) Sze via omalley)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3546">HADOOP-3546</a>. TaskTracker re-initialization gets stuck in cleaning up.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3576">HADOOP-3576</a>. Fix NullPointerException when renaming a directory
- to its subdirectory. (Tsz Wo (Nicholas), SZE via hairong)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3320">HADOOP-3320</a>. Fix NullPointerException in NetworkTopology.getDistance().<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3569">HADOOP-3569</a>. KFS input stream read() now correctly reads 1 byte
- instead of 4.<br />(Sriram Rao via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3599">HADOOP-3599</a>. Fix JobConf::setCombineOnceOnly to modify the instance rather
- than a parameter.<br />(Owen O'Malley via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3590">HADOOP-3590</a>. Null pointer exception in JobTracker when the task tracker is
- not yet resolved.<br />(Amar Ramesh Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3603">HADOOP-3603</a>. Fix MapOutputCollector to spill when io.sort.spill.percent is
- 1.0 and to detect spills when emitted records write no data.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3615">HADOOP-3615</a>. Set DatanodeProtocol.versionID to the correct value.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3559">HADOOP-3559</a>. Fix the libhdfs test script and config to work with the
- current semantics.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3480">HADOOP-3480</a>. Need to update Eclipse template to reflect current trunk.<br />(Brice Arnould via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3588">HADOOP-3588</a>. Fixed usability issues with archives.<br />(mahadev)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3635">HADOOP-3635</a>. Uncaught exception in DataBlockScanner.
- (Tsz Wo (Nicholas), SZE via hairong)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3639">HADOOP-3639</a>. Exception when closing DFSClient while multiple files are
- open.<br />(Benjamin Gufler via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3572">HADOOP-3572</a>. SetQuotas usage interface has some minor bugs.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3649">HADOOP-3649</a>. Fix bug in removing blocks from the corrupted block map.<br />(Lohit Vijayarenu via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3604">HADOOP-3604</a>. Work around a JVM synchronization problem observed while
- retrieving the address of direct buffers from compression code by obtaining
- a lock during this call.<br />(Arun C Murthy via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3683">HADOOP-3683</a>. Fix dfs metrics to count file listings rather than files
- listed.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3597">HADOOP-3597</a>. Fix SortValidator to use filesystems other than the default as
- input. Validation job still runs on default fs.<br />(Jothi Padmanabhan via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3693">HADOOP-3693</a>. Fix archives, distcp and native library documentation to
- conform to style guidelines.<br />(Amareshwari Sriramadasu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3653">HADOOP-3653</a>. Fix test-patch target to properly account for Eclipse
- classpath jars.<br />(Brice Arnould via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3692">HADOOP-3692</a>. Fix documentation for Cluster setup and Quick start guides.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3691">HADOOP-3691</a>. Fix streaming and tutorial docs.<br />(Jothi Padmanabhan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3630">HADOOP-3630</a>. Fix NullPointerException in CompositeRecordReader from empty
- sources<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3706">HADOOP-3706</a>. Fix a ClassLoader issue in the mapred.join Parser that
- prevents it from loading user-specified InputFormats.<br />(Jingkei Ly via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3718">HADOOP-3718</a>. Fix KFSOutputStream::write(int) to output a byte instead of
- an int, per the OutputStream contract.<br />(Sriram Rao via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3647">HADOOP-3647</a>. Add debug logs to help track down a very occasional,
- hard-to-reproduce, bug in shuffle/merge on the reducer.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3716">HADOOP-3716</a>. Prevent listStatus in KosmosFileSystem from returning
- null for valid, empty directories.<br />(Sriram Rao via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3752">HADOOP-3752</a>. Fix audit logging to record rename events.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3737">HADOOP-3737</a>. Fix CompressedWritable to call Deflater::end to release
- compressor memory.<br />(Grant Glouser via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3670">HADOOP-3670</a>. Fixes JobTracker to clear out split bytes when no longer
- required.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3755">HADOOP-3755</a>. Update gridmix to work with HOD 0.4<br />(Runping Qi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3743">HADOOP-3743</a>. Fix -libjars, -files, -archives options to work even if
- user code does not implement tools.<br />(Amareshwari Sriramadasu via mahadev)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3774">HADOOP-3774</a>. Fix typos in shell output. (Tsz Wo (Nicholas), SZE via
- cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3762">HADOOP-3762</a>. Fixed FileSystem cache to work with the default port.<br />(cutting
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3798">HADOOP-3798</a>. Fix tests compilation.<br />(Mukund Madhugiri via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3794">HADOOP-3794</a>. Return modification time instead of zero for KosmosFileSystem.<br />(Sriram Rao via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3806">HADOOP-3806</a>. Remove debug statement to stdout from QuickSort.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3776">HADOOP-3776</a>. Fix NPE at NameNode when datanode reports a block after it is
- deleted at NameNode.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3537">HADOOP-3537</a>. Disallow adding a datanode to a network topology when its
- network location is not resolved.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3571">HADOOP-3571</a>. Fix bug in block removal used in lease recovery.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3645">HADOOP-3645</a>. MetricsTimeVaryingRate returns wrong value for
- metric_avg_time.<br />(Lohit Vijayarenu via hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3521">HADOOP-3521</a>. Reverted the missing cast to float for sending Counters' values
- to Hadoop metrics which was removed by <a href="http://issues.apache.org/jira/browse/HADOOP-544">HADOOP-544</a>.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3820">HADOOP-3820</a>. Fixes two problems in the gridmix-env - a syntax error, and a
- wrong definition of USE_REAL_DATASET by default.<br />(Arun Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3724">HADOOP-3724</a>. Fixes two problems related to storing and recovering lease
- in the fsimage.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3827">HADOOP-3827</a>. Fixed compression of empty map-outputs.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3865">HADOOP-3865</a>. Remove reference to FSNamesystem from metrics preventing
- garbage collection.<br />(Lohit Vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3884">HADOOP-3884</a>. Fix so that Eclipse plugin builds against recent
- Eclipse releases.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3837">HADOOP-3837</a>. Streaming jobs report progress status.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3897">HADOOP-3897</a>. Fix a NPE in secondary namenode.<br />(Lohit Vijayarenu via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3901">HADOOP-3901</a>. Fix bin/hadoop to correctly set classpath under cygwin.
- (Tsz Wo (Nicholas) Sze via omalley)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3947">HADOOP-3947</a>. Fix a problem in tasktracker reinitialization.<br />(Amareshwari Sriramadasu via ddas)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.17.3_-_unreleased_')">Release 0.17.3 - Unreleased
- </a></h3>
- <ul id="release_0.17.3_-_unreleased_">
- <li><a href="javascript:toggleList('release_0.17.3_-_unreleased_._improvements_')"> IMPROVEMENTS
- </a> (1)
- <ol id="release_0.17.3_-_unreleased_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4164">HADOOP-4164</a>. Chinese translation of the documentation.<br />(Xuebing Yan via
- omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.3_-_unreleased_._bug_fixes_')"> BUG FIXES
- </a> (4)
- <ol id="release_0.17.3_-_unreleased_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4277">HADOOP-4277</a>. Checksum verification was mistakenly disabled for
- LocalFileSystem.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4271">HADOOP-4271</a>. Checksum input stream can sometimes return invalid
- data to the user.<br />(Ning Li via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4318">HADOOP-4318</a>. DistCp should use absolute paths for cleanup.<br />(szetszwo)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-4326">HADOOP-4326</a>. ChecksumFileSystem does not override create(...) correctly.<br />(szetszwo)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.17.2_-_2008-08-11_')">Release 0.17.2 - 2008-08-11
- </a></h3>
- <ul id="release_0.17.2_-_2008-08-11_">
- <li><a href="javascript:toggleList('release_0.17.2_-_2008-08-11_._bug_fixes_')"> BUG FIXES
- </a> (12)
- <ol id="release_0.17.2_-_2008-08-11_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3678">HADOOP-3678</a>. Avoid spurious exceptions logged at DataNode when clients
- read from DFS.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3707">HADOOP-3707</a>. NameNode keeps a count of number of blocks scheduled
- to be written to a datanode and uses it to avoid allocating more
- blocks than a datanode can hold.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3760">HADOOP-3760</a>. Fix a bug with HDFS file close() mistakenly introduced
- by <a href="http://issues.apache.org/jira/browse/HADOOP-3681">HADOOP-3681</a>.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3681">HADOOP-3681</a>. DFSClient can get into an infinite loop while closing
- a file if there are some errors.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3002">HADOOP-3002</a>. Hold off block removal while in safe mode.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3685">HADOOP-3685</a>. Unbalanced replication target.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3758">HADOOP-3758</a>. Shutdown datanode on version mismatch instead of retrying
- continuously, preventing excessive logging at the namenode.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3633">HADOOP-3633</a>. Correct exception handling in DataXceiveServer, and throttle
- the number of xceiver threads in a data-node.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3370">HADOOP-3370</a>. Ensure that the TaskTracker.runningJobs data-structure is
- correctly cleaned-up on task completion.<br />(Zheng Shao via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3813">HADOOP-3813</a>. Fix task-output clean-up on HDFS to use the recursive
- FileSystem.delete rather than the FileUtil.fullyDelete.<br />(Amareshwari
- Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3859">HADOOP-3859</a>. Allow the maximum number of xceivers in the data node to
- be configurable.<br />(Johan Oskarsson via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3931">HADOOP-3931</a>. Fix corner case in the map-side sort that causes some values
- to be counted as too large and cause premature spills to disk. Some values
- will also bypass the combiner incorrectly.<br />(cdouglas via omalley)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.17.1_-_2008-06-23_')">Release 0.17.1 - 2008-06-23
- </a></h3>
- <ul id="release_0.17.1_-_2008-06-23_">
- <li><a href="javascript:toggleList('release_0.17.1_-_2008-06-23_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (1)
- <ol id="release_0.17.1_-_2008-06-23_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3565">HADOOP-3565</a>. Fix the Java serialization, which is not enabled by
- default, to clear the state of the serializer between objects.<br />(tomwhite via omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.1_-_2008-06-23_._improvements_')"> IMPROVEMENTS
- </a> (2)
- <ol id="release_0.17.1_-_2008-06-23_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3522">HADOOP-3522</a>. Improve documentation on reduce pointing out that
- input keys and values will be reused.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3487">HADOOP-3487</a>. Balancer uses thread pools for managing its threads;
- therefore provides better resource management.<br />(hairong)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.1_-_2008-06-23_._bug_fixes_')"> BUG FIXES
- </a> (8)
- <ol id="release_0.17.1_-_2008-06-23_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2159">HADOOP-2159</a>. Namenode stuck in safemode. The counter blockSafe should
- not be decremented for invalid blocks.<br />(hairong)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3472">HADOOP-3472</a>. MapFile.Reader getClosest() function returns incorrect results
- when before is true.<br />(Todd Lipcon via Stack)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3442">HADOOP-3442</a>. Limit recursion depth on the stack for QuickSort to prevent
- StackOverflowErrors. To avoid O(n*n) cases, when partitioning depth exceeds
- a multiple of log(n), change to HeapSort.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3477">HADOOP-3477</a>. Fix build to not package contrib/*/bin twice in
- distributions.<br />(Adam Heath via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3475">HADOOP-3475</a>. Fix MapTask to correctly size the accounting allocation of
- io.sort.mb.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3550">HADOOP-3550</a>. Fix the serialization data structures in MapTask where the
- value lengths are incorrectly calculated.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3526">HADOOP-3526</a>. Fix contrib/data_join framework by cloning values retained
- in the reduce.<br />(Spyros Blanas via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1979">HADOOP-1979</a>. Speed up fsck by adding a buffered stream.<br />(Lohit
- Vijaya Renu via omalley)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.17.0_-_2008-05-18_')">Release 0.17.0 - 2008-05-18
- </a></h3>
- <ul id="release_0.17.0_-_2008-05-18_">
- <li><a href="javascript:toggleList('release_0.17.0_-_2008-05-18_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (26)
- <ol id="release_0.17.0_-_2008-05-18_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2786">HADOOP-2786</a>. Move hbase out of hadoop core
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2345">HADOOP-2345</a>. New HDFS transactions to support appending
- to files. Disk layout version changed from -11 to -12.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2192">HADOOP-2192</a>. Error messages from "dfs mv" command improved.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1902">HADOOP-1902</a>. "dfs du" command without any arguments operates on the
- current working directory.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2873">HADOOP-2873</a>. Fixed bad disk format introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-2345">HADOOP-2345</a>.
- Disk layout version changed from -12 to -13. See changelist 630992<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1985">HADOOP-1985</a>. This addresses rack-awareness for Map tasks and for
- HDFS in a uniform way.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1986">HADOOP-1986</a>. Add support for a general serialization mechanism for
- Map Reduce.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-771">HADOOP-771</a>. FileSystem.delete() takes an explicit parameter that
- specifies whether a recursive delete is intended.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2470">HADOOP-2470</a>. Remove getContentLength(String), open(String, long, long)
- and isDir(String) from ClientProtocol. ClientProtocol version changed
- from 26 to 27. (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2822">HADOOP-2822</a>. Remove deprecated code for classes InputFormatBase and
- PhasedFileSystem.<br />(Amareshwari Sriramadasu via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2116">HADOOP-2116</a>. Changes the layout of the task execution directory.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2828">HADOOP-2828</a>. The following deprecated methods in Configuration.java
- have been removed
- getObject(String name)
- setObject(String name, Object value)
- get(String name, Object defaultValue)
- set(String name, Object value)
- Iterator entries()<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2824">HADOOP-2824</a>. Removes one deprecated constructor from MiniMRCluster.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2823">HADOOP-2823</a>. Removes deprecated methods getColumn(), getLine() from
- org.apache.hadoop.record.compiler.generated.SimpleCharStream.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3060">HADOOP-3060</a>. Removes one unused constructor argument from MiniMRCluster.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2854">HADOOP-2854</a>. Remove deprecated o.a.h.ipc.Server::getUserInfo().<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2563">HADOOP-2563</a>. Remove deprecated FileSystem::listPaths.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2818">HADOOP-2818</a>. Remove deprecated methods in Counters.<br />(Amareshwari Sriramadasu via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2831">HADOOP-2831</a>. Remove deprecated o.a.h.dfs.INode::getAbsoluteName()<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2839">HADOOP-2839</a>. Remove deprecated FileSystem::globPaths.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2634">HADOOP-2634</a>. Deprecate ClientProtocol::exists.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2410">HADOOP-2410</a>. Make EC2 cluster nodes more independent of each other.
- Multiple concurrent EC2 clusters are now supported, and nodes may be
- added to a cluster on the fly with new nodes starting in the same EC2
- availability zone as the cluster. Ganglia monitoring and large
- instance sizes have also been added.<br />(Chris K Wensel via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2826">HADOOP-2826</a>. Deprecated FileSplit.getFile(), LineRecordReader.readLine().<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3239">HADOOP-3239</a>. getFileInfo() returns null for non-existing files instead
- of throwing FileNotFoundException.<br />(Lohit Vijayarenu via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3266">HADOOP-3266</a>. Removed HOD changes from CHANGES.txt, as they are now inside
- src/contrib/hod<br />(Hemanth Yamijala via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3280">HADOOP-3280</a>. Separate the configuration of the virtual memory size
- (mapred.child.ulimit) from the jvm heap size, so that 64 bit
- streaming applications are supported even when running with 32 bit
- jvms.<br />(acmurthy via omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.0_-_2008-05-18_._new_features_')"> NEW FEATURES
- </a> (12)
- <ol id="release_0.17.0_-_2008-05-18_._new_features_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1398">HADOOP-1398</a>. Add HBase in-memory block cache.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2178">HADOOP-2178</a>. Job History on DFS.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2063">HADOOP-2063</a>. A new parameter to dfs -get command to fetch a file
- even if it is corrupted. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2219">HADOOP-2219</a>. A new command "df -count" that counts the number of
- files and directories. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2906">HADOOP-2906</a>. Add an OutputFormat capable of using keys, values, and
- config params to map records to different output files.<br />(Runping Qi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2346">HADOOP-2346</a>. Utilities to support timeout while writing to sockets.
- DFSClient and DataNode sockets have 10min write timeout.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2951">HADOOP-2951</a>. Add a contrib module that provides a utility to
- build or update Lucene indexes using Map/Reduce.<br />(Ning Li via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1622">HADOOP-1622</a>. Allow multiple jar files for map reduce.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2055">HADOOP-2055</a>. Allows users to set PathFilter on the FileInputFormat.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2551">HADOOP-2551</a>. More environment variables like HADOOP_NAMENODE_OPTS
- for better control of HADOOP_OPTS for each component.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3001">HADOOP-3001</a>. Add job counters that measure the number of bytes
- read and written to HDFS, S3, KFS, and local file systems.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3048">HADOOP-3048</a>. A new Interface and a default implementation to convert
- and restore serializations of objects to/from strings.<br />(enis)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.0_-_2008-05-18_._improvements_')"> IMPROVEMENTS
- </a> (29)
- <ol id="release_0.17.0_-_2008-05-18_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2655">HADOOP-2655</a>. Copy on write for data and metadata files in the
- presence of snapshots. Needed for supporting appends to HDFS
- files.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1967">HADOOP-1967</a>. When a Path specifies the same scheme as the default
- FileSystem but no authority, the default FileSystem's authority is
- used. Also add warnings for old-format FileSystem names, accessor
- methods for fs.default.name, and check for null authority in HDFS.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2895">HADOOP-2895</a>. Let the profiling string be configurable.<br />(Martin Traverso via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-910">HADOOP-910</a>. Enables Reduces to do merges for the on-disk map output files
- in parallel with their copying.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-730">HADOOP-730</a>. Use rename rather than copy for local renames.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2810">HADOOP-2810</a>. Updated the Hadoop Core logo.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2057">HADOOP-2057</a>. Streaming should optionally treat a non-zero exit status
- of a child process as a failed task.<br />(Rick Cox via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2765">HADOOP-2765</a>. Enables specifying ulimits for streaming/pipes tasks<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2888">HADOOP-2888</a>. Make gridmix scripts more readily configurable and amenable
- to automated execution.<br />(Mukund Madhugiri via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2908">HADOOP-2908</a>. A document that describes the DFS Shell command.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2981">HADOOP-2981</a>. Update README.txt to reflect the upcoming use of
- cryptography.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2804">HADOOP-2804</a>. Add support to publish CHANGES.txt as HTML when running
- the Ant 'docs' target.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2559">HADOOP-2559</a>. Change DFS block placement to allocate the first replica
- locally, the second off-rack, and the third intra-rack from the
- second.<br />(lohit vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2939">HADOOP-2939</a>. Make the automated patch testing process an executable
- Ant target, test-patch.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2239">HADOOP-2239</a>. Add HsftpFileSystem to permit transferring files over ssl.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2886">HADOOP-2886</a>. Track individual RPC metrics.<br />(girish vaitheeswaran via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2373">HADOOP-2373</a>. Improvement in safe-mode reporting.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3091">HADOOP-3091</a>. Modify FsShell command -put to accept multiple sources.<br />(Lohit Vijaya Renu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3092">HADOOP-3092</a>. Show counter values from job -status command.<br />(Tom White via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1228">HADOOP-1228</a>. Ant task to generate Eclipse project files.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3093">HADOOP-3093</a>. Adds Configuration.getStrings(name, default-value) and
- the corresponding setStrings.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3106">HADOOP-3106</a>. Adds documentation in forrest for debugging.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3099">HADOOP-3099</a>. Add an option to distcp to preserve user, group, and
- permission information. (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2841">HADOOP-2841</a>. Unwrap AccessControlException and FileNotFoundException
- from RemoteException for DFSClient.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3152">HADOOP-3152</a>. Make index interval configurable when using
- MapFileOutputFormat for map-reduce job.<br />(Rong-En Fan via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3143">HADOOP-3143</a>. Decrease number of slaves from 4 to 3 in TestMiniMRDFSSort,
- as Hudson generates false negatives under the current load.<br />(Nigel Daley via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3174">HADOOP-3174</a>. Illustrative example for MultipleFileInputFormat.<br />(Enis
- Soztutar via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2993">HADOOP-2993</a>. Clarify the usage of JAVA_HOME in the Quick Start guide.<br />(acmurthy via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3124">HADOOP-3124</a>. Make DataNode socket write timeout configurable.<br />(rangadi)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.0_-_2008-05-18_._optimizations_')"> OPTIMIZATIONS
- </a> (12)
- <ol id="release_0.17.0_-_2008-05-18_._optimizations_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2790">HADOOP-2790</a>. Fixed inefficient method hasSpeculativeTask by removing
- repetitive calls to get the current time and late checking to see if
- we want speculation on at all.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2758">HADOOP-2758</a>. Reduce buffer copies in DataNode when data is read from
- HDFS, without negatively affecting read throughput.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2399">HADOOP-2399</a>. Input key and value to combiner and reducer is reused.
- (Owen O'Malley via ddas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2423">HADOOP-2423</a>. Code optimization in FSNamesystem.mkdirs.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2606">HADOOP-2606</a>. ReplicationMonitor selects data-nodes to replicate directly
- from needed replication blocks instead of looking up for the blocks for
- each live data-node.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2148">HADOOP-2148</a>. Eliminate redundant data-node blockMap lookups.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2027">HADOOP-2027</a>. Return the number of bytes in each block in a file
- via a single rpc to the namenode to speed up job planning.<br />(Lohit Vijaya Renu via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2902">HADOOP-2902</a>. Replace uses of "fs.default.name" with calls to the
- accessor methods added in <a href="http://issues.apache.org/jira/browse/HADOOP-1967">HADOOP-1967</a>.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2119">HADOOP-2119</a>. Optimize scheduling of jobs with large numbers of
- tasks by replacing static arrays with lists of runnable tasks.<br />(Amar Kamat via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2919">HADOOP-2919</a>. Reduce the number of memory copies done during the
- map output sorting. Also adds two config variables:
- io.sort.spill.percent - the percentages of io.sort.mb that should
- cause a spill (default 80%)
- io.sort.record.percent - the percent of io.sort.mb that should
- hold key/value indexes (default 5%)<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3140">HADOOP-3140</a>. Doesn't add a task in the commit queue if the task hadn't
- generated any output.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3168">HADOOP-3168</a>. Reduce the amount of logging in streaming to an
- exponentially increasing number of records (up to 10,000
- records/log).<br />(Zheng Shao via omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.17.0_-_2008-05-18_._bug_fixes_')"> BUG FIXES
- </a> (102)
- <ol id="release_0.17.0_-_2008-05-18_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2195">HADOOP-2195</a>. '-mkdir' behaviour is now closer to Linux shell in case of
- errors.<br />(Mahadev Konar via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2190">HADOOP-2190</a>. Bring behaviour of '-ls' and '-du' closer to Linux shell
- commands in case of errors.<br />(Mahadev Konar via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2193">HADOOP-2193</a>. 'fs -rm' and 'fs -rmr' show error message when the target
- file does not exist.<br />(Mahadev Konar via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2738">HADOOP-2738</a>. Text is not subclassable because set(Text) and compareTo(Object)
- access the other instance's private members directly.<br />(jimk)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2779">HADOOP-2779</a>. Remove the references to HBase in the build.xml.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2194">HADOOP-2194</a>. dfs cat on a non-existent file throws FileNotFoundException.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2767">HADOOP-2767</a>. Fix for NetworkTopology erroneously skipping the last leaf
- node on a rack.<br />(Hairong Kuang and Mark Butler via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1593">HADOOP-1593</a>. FsShell works with paths in non-default FileSystem.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2191">HADOOP-2191</a>. du and dus command on non-existent directory gives
- appropriate error message.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2832">HADOOP-2832</a>. Remove tabs from code of DFSClient for better
- indentation.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2844">HADOOP-2844</a>. distcp closes file handles for sequence files.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2727">HADOOP-2727</a>. Fix links in Web UI of the hadoop daemons and some docs<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2871">HADOOP-2871</a>. Fixes a problem to do with file: URI in the JobHistory init.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2800">HADOOP-2800</a>. Deprecate SetFile.Writer constructor not the whole class.<br />(Johan Oskarsson via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2891">HADOOP-2891</a>. DFSClient.close() closes all open files.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2845">HADOOP-2845</a>. Fix dfsadmin disk utilization report on Solaris.<br />(Martin Traverso via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2912">HADOOP-2912</a>. MiniDFSCluster restart should wait for namenode to exit
- safemode. This was causing TestFsck to fail.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2820">HADOOP-2820</a>. The following classes in streaming are removed :
- StreamLineRecordReader StreamOutputFormat StreamSequenceRecordReader.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2819">HADOOP-2819</a>. The following methods in JobConf are removed:
- getInputKeyClass() setInputKeyClass getInputValueClass()
- setInputValueClass(Class theClass) setSpeculativeExecution
- getSpeculativeExecution()<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2817">HADOOP-2817</a>. Removes deprecated mapred.tasktracker.tasks.maximum and
- ClusterStatus.getMaxTasks().<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2821">HADOOP-2821</a>. Removes deprecated ShellUtil and ToolBase classes from
- the util package.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2934">HADOOP-2934</a>. The namenode was encountering an NPE while loading
- leases from the fsimage. Fixed.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2938">HADOOP-2938</a>. Some fs commands did not glob paths.
- (Tsz Wo (Nicholas), SZE via rangadi)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2943">HADOOP-2943</a>. Compression of intermediate map output causes failures
- in the merge.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2870">HADOOP-2870</a>. DataNode and NameNode close all connections while
- shutting down.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2973">HADOOP-2973</a>. Fix TestLocalDFS for Windows platform.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2971">HADOOP-2971</a>. select multiple times if it returns early in
- SocketIOWithTimeout.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2955">HADOOP-2955</a>. Fix TestCrcCorruption test failures caused by <a href="http://issues.apache.org/jira/browse/HADOOP-2758">HADOOP-2758</a><br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2657">HADOOP-2657</a>. A flush call on the DFSOutputStream flushes the last
- partial CRC chunk too.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2974">HADOOP-2974</a>. IPC unit tests used "0.0.0.0" to connect to server, which
- is not always supported.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2996">HADOOP-2996</a>. Fixes uses of StringBuffer in StreamUtils class.<br />(Dave Brosius via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2995">HADOOP-2995</a>. Fixes StreamBaseRecordReader's getProgress to return a
- floating point number.<br />(Dave Brosius via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2972">HADOOP-2972</a>. Fix for a NPE in FSDataset.invalidate.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2994">HADOOP-2994</a>. Code cleanup for DFSClient: remove redundant
- conversions from string to string.<br />(Dave Brosius via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3009">HADOOP-3009</a>. TestFileCreation sometimes fails because restarting
- minidfscluster sometimes creates datanodes with ports that are
- different from their original instance.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2992">HADOOP-2992</a>. Distributed Upgrade framework works correctly with
- more than one upgrade object.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2679">HADOOP-2679</a>. Fix a typo in libhdfs.<br />(Jason via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2976">HADOOP-2976</a>. When a lease expires, the Namenode ensures that
- blocks of the file are adequately replicated.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2901">HADOOP-2901</a>. Fixes the creation of info servers in the JobClient
- and JobTracker. Removes the creation from JobClient and removes
- additional info server from the JobTracker. Also adds the command
- line utility to view the history files (<a href="http://issues.apache.org/jira/browse/HADOOP-2896">HADOOP-2896</a>), and fixes
- bugs in JSPs to do with analysis - <a href="http://issues.apache.org/jira/browse/HADOOP-2742">HADOOP-2742</a>, <a href="http://issues.apache.org/jira/browse/HADOOP-2792">HADOOP-2792</a>.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2890">HADOOP-2890</a>. If different datanodes report the same block but
- with different sizes to the namenode, the namenode picks the
- replica(s) with the largest size as the only valid replica(s).<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2825">HADOOP-2825</a>. Deprecated MapOutputLocation.getFile() is removed.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2806">HADOOP-2806</a>. Fixes a streaming document.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3008">HADOOP-3008</a>. SocketIOWithTimeout throws InterruptedIOException if the
- thread is interrupted while it is waiting.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3006">HADOOP-3006</a>. Fix wrong packet size reported by DataNode when a block
- is being replicated.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3029">HADOOP-3029</a>. Datanode prints log message "firstbadlink" only if
- it detects a bad connection to another datanode in the pipeline.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3030">HADOOP-3030</a>. Release reserved space for file in InMemoryFileSystem if
- checksum reservation fails.<br />(Devaraj Das via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3036">HADOOP-3036</a>. Fix findbugs warnings in UpgradeUtilities.<br />(Konstantin
- Shvachko via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3025">HADOOP-3025</a>. ChecksumFileSystem supports the delete method with
- the recursive flag.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3012">HADOOP-3012</a>. dfs -mv file to user home directory throws exception if
- the user home directory does not exist.<br />(Mahadev Konar via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3066">HADOOP-3066</a>. Should not require superuser privilege to query if hdfs is in
- safe mode<br />(jimk)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3040">HADOOP-3040</a>. If the input line starts with the separator char, the key
- is set as empty.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3080">HADOOP-3080</a>. Removes flush calls from JobHistory.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3086">HADOOP-3086</a>. Adds the testcase missed during commit of hadoop-3040.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3046">HADOOP-3046</a>. Fix the raw comparators for Text and BytesWritables
- to use the provided length rather than recompute it.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3094">HADOOP-3094</a>. Fix BytesWritable.toString to avoid extending the sign bit<br />(Owen O'Malley via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3067">HADOOP-3067</a>. DFSInputStream's position read does not close the sockets.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3073">HADOOP-3073</a>. close() on SocketInputStream or SocketOutputStream should
- close the underlying channel.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3087">HADOOP-3087</a>. Fixes a problem to do with refreshing of loadHistory.jsp.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3065">HADOOP-3065</a>. Better logging message if the rack location of a datanode
- cannot be determined.<br />(Devaraj Das via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3064">HADOOP-3064</a>. Commas in a file path should not be treated as delimiters.<br />(Hairong Kuang via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2997">HADOOP-2997</a>. Adds test for non-writable serializer. Also fixes a problem
- introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-2399">HADOOP-2399</a>.<br />(Tom White via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3114">HADOOP-3114</a>. Fix TestDFSShell on Windows.<br />(Lohit Vijaya Renu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3118">HADOOP-3118</a>. Fix Namenode NPE while loading fsimage after a cluster
- upgrade from older disk format.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3161">HADOOP-3161</a>. Fix FileUtil.HardLink.getLinkCount on Mac OS.<br />(nigel
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2927">HADOOP-2927</a>. Fix TestDU to accurately calculate the expected file size.<br />(shv via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3123">HADOOP-3123</a>. Fix the native library build scripts to work on Solaris.<br />(tomwhite via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3089">HADOOP-3089</a>. Streaming should accept stderr from task before
- first key arrives.<br />(Rick Cox via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3146">HADOOP-3146</a>. A DFSOutputStream.flush method is renamed as
- DFSOutputStream.fsync.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3165">HADOOP-3165</a>. -put/-copyFromLocal did not treat input file "-" as stdin.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3041">HADOOP-3041</a>. Deprecate JobConf.setOutputPath and JobConf.getOutputPath.
- Deprecate OutputFormatBase. Add FileOutputFormat. Existing output formats
- extending OutputFormatBase, now extend FileOutputFormat. Add the following
- APIs in FileOutputFormat: setOutputPath, getOutputPath, getWorkOutputPath.<br />(Amareshwari Sriramadasu via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3083">HADOOP-3083</a>. The fsimage does not store leases. This would have to be
- reworked in the next release to support appends.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3166">HADOOP-3166</a>. Fix an ArrayIndexOutOfBoundsException in the spill thread
- and make exception handling more promiscuous to catch this condition.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3050">HADOOP-3050</a>. DataNode sends one and only one block report after
- it registers with the namenode.<br />(Hairong Kuang)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3044">HADOOP-3044</a>. NNBench sets the right configuration for the mapper.<br />(Hairong Kuang)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3178">HADOOP-3178</a>. Fix GridMix scripts for small and medium jobs
- to handle input paths differently.<br />(Mukund Madhugiri via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1911">HADOOP-1911</a>. Fix an infinite loop in DFSClient when all replicas of a
- block are bad<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3157">HADOOP-3157</a>. Fix path handling in DistributedCache and TestMiniMRLocalFS.<br />(Doug Cutting via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3018">HADOOP-3018</a>. Fix the eclipse plug-in contrib wrt removed deprecated
- methods<br />(taton)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3183">HADOOP-3183</a>. Fix TestJobShell to use 'ls' instead of java.io.File::exists
- since cygwin symlinks are unsupported.<br />(Mahadev Konar via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3175">HADOOP-3175</a>. Fix FsShell.CommandFormat to handle "-" in arguments.<br />(Edward J. Yoon via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3220">HADOOP-3220</a>. Safemode message corrected.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3208">HADOOP-3208</a>. Fix WritableDeserializer to set the Configuration on
- deserialized Writables.<br />(Enis Soztutar via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3224">HADOOP-3224</a>. 'dfs -du /dir' does not return correct size.<br />(Lohit Vijayarenu via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3223">HADOOP-3223</a>. Fix typo in help message for -chmod.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1373">HADOOP-1373</a>. checkPath() should ignore case when it compares authority.<br />(Edward J. Yoon via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3204">HADOOP-3204</a>. Fixes a problem to do with ReduceTask's LocalFSMerger not
- catching Throwable.<br />(Amar Ramesh Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3229">HADOOP-3229</a>. Report progress when collecting records from the mapper and
- the combiner.<br />(Doug Cutting via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3225">HADOOP-3225</a>. Unwrapping methods of RemoteException should initialize
- detailedMassage field.<br />(Mahadev Konar, shv, cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3247">HADOOP-3247</a>. Fix gridmix scripts to use the correct globbing syntax and
- change maxentToSameCluster to run the correct number of jobs.<br />(Runping Qi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3242">HADOOP-3242</a>. Fix the RecordReader of SequenceFileAsBinaryInputFormat to
- correctly read from the start of the split and not the beginning of the
- file.<br />(cdouglas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3256">HADOOP-3256</a>. Encodes the job name used in the filename for history files.<br />(Arun Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3162">HADOOP-3162</a>. Ensure that comma-separated input paths are treated correctly
- as multiple input paths.<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3263">HADOOP-3263</a>. Ensure that the job-history log file always follows the
- pattern of hostname_timestamp_jobid_username_jobname even if username
- and/or jobname are not specified. This helps to avoid wrong assumptions
- made about the job-history log filename in jobhistory.jsp.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3251">HADOOP-3251</a>. Fixes getFilesystemName in JobTracker and LocalJobRunner to
- use FileSystem.getUri instead of FileSystem.getName.<br />(Arun Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3237">HADOOP-3237</a>. Fixes TestDFSShell.testErrOutPut on Windows platform.<br />(Mahadev Konar via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3279">HADOOP-3279</a>. TaskTracker checks for SUCCEEDED task status in addition to
- COMMIT_PENDING status when it fails maps due to lost map.<br />(Devaraj Das)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3286">HADOOP-3286</a>. Prevent collisions in gridmix output dirs by increasing the
- granularity of the timestamp.<br />(Runping Qi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3285">HADOOP-3285</a>. Fix input split locality when the splits align to
- fs blocks.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3372">HADOOP-3372</a>. Fix heap management in streaming tests.<br />(Arun Murthy via
- cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3031">HADOOP-3031</a>. Fix javac warnings in test classes.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3382">HADOOP-3382</a>. Fix memory leak when files are not cleanly closed<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3322">HADOOP-3322</a>. Fix to push MetricsRecord for rpc metrics.<br />(Eric Yang via
- mukund)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.16.4_-_2008-05-05_')">Release 0.16.4 - 2008-05-05
- </a></h3>
- <ul id="release_0.16.4_-_2008-05-05_">
- <li><a href="javascript:toggleList('release_0.16.4_-_2008-05-05_._bug_fixes_')"> BUG FIXES
- </a> (3)
- <ol id="release_0.16.4_-_2008-05-05_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3138">HADOOP-3138</a>. DFS mkdirs() should not throw an exception if the directory
- already exists.<br />(rangadi via mukund)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3294">HADOOP-3294</a>. Fix distcp to check the destination length and retry the copy
- if it doesn't match the src length. (Tsz Wo (Nicholas), SZE via mukund)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3186">HADOOP-3186</a>. Fix incorrect permission checking for mv and renameTo
- in HDFS. (Tsz Wo (Nicholas), SZE via mukund)
- </li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.16.3_-_2008-04-16_')">Release 0.16.3 - 2008-04-16
- </a></h3>
- <ul id="release_0.16.3_-_2008-04-16_">
- <li><a href="javascript:toggleList('release_0.16.3_-_2008-04-16_._bug_fixes_')"> BUG FIXES
- </a> (7)
- <ol id="release_0.16.3_-_2008-04-16_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3010">HADOOP-3010</a>. Fix ConcurrentModificationException in ipc.Server.Responder.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3154">HADOOP-3154</a>. Catch all Throwables from the SpillThread in MapTask, rather
- than IOExceptions only.<br />(ddas via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3159">HADOOP-3159</a>. Avoid file system cache being overwritten whenever
- configuration is modified. (Tsz Wo (Nicholas), SZE via hairong)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3139">HADOOP-3139</a>. Remove the consistency check for the FileSystem cache in
- closeAll() that causes spurious warnings and a deadlock.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3195">HADOOP-3195</a>. Fix TestFileSystem to be deterministic.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3069">HADOOP-3069</a>. Primary name-node should not truncate image when transferring
- it from the secondary.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3182">HADOOP-3182</a>. Change permissions of the job-submission directory to 777
- from 733 to ensure sharing of HOD clusters works correctly. (Tsz Wo
- (Nicholas), Sze and Amareshwari Sri Ramadasu via acmurthy)
- </li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.16.2_-_2008-04-02_')">Release 0.16.2 - 2008-04-02
- </a></h3>
- <ul id="release_0.16.2_-_2008-04-02_">
- <li><a href="javascript:toggleList('release_0.16.2_-_2008-04-02_._bug_fixes_')"> BUG FIXES
- </a> (18)
- <ol id="release_0.16.2_-_2008-04-02_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3011">HADOOP-3011</a>. Prohibit distcp from overwriting directories on the
- destination filesystem with files.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3033">HADOOP-3033</a>. The BlockReceiver thread in the datanode writes data to
- the block file, changes file position (if needed) and flushes all by
- itself. The PacketResponder thread does not flush block file.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2978">HADOOP-2978</a>. Fixes the JobHistory log format for counters.<br />(Runping Qi via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2985">HADOOP-2985</a>. Fixes LocalJobRunner to tolerate null job output path.
- Also makes the _temporary a constant in MRConstants.java.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3003">HADOOP-3003</a>. FileSystem cache key is updated after a
- FileSystem object is created. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3042">HADOOP-3042</a>. Updates the Javadoc in JobConf.getOutputPath to reflect
- the actual temporary path.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3007">HADOOP-3007</a>. Tolerate mirror failures while DataNode is replicating
- blocks as it used to before.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2944">HADOOP-2944</a>. Fixes a "Run on Hadoop" wizard NPE when creating a
- Location from the wizard.<br />(taton)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3049">HADOOP-3049</a>. Fixes a problem in MultiThreadedMapRunner to do with
- catching RuntimeExceptions.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3039">HADOOP-3039</a>. Fixes a problem to do with exceptions in tasks not
- killing jobs.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3027">HADOOP-3027</a>. Fixes a problem to do with adding a shutdown hook in
- FileSystem.<br />(Amareshwari Sriramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3056">HADOOP-3056</a>. Fix distcp when the target is an empty directory by
- making sure the directory is created first.<br />(cdouglas and acmurthy
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3070">HADOOP-3070</a>. Protect the trash emptier thread from null pointer
- exceptions.<br />(Koji Noguchi via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3084">HADOOP-3084</a>. Fix HftpFileSystem to work for zero-length files.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3107">HADOOP-3107</a>. Fix NPE when fsck invokes getListings.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3104">HADOOP-3104</a>. Limit MultithreadedMapRunner to have a fixed length queue
- between the RecordReader and the map threads.<br />(Alejandro Abdelnur via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2833">HADOOP-2833</a>. Do not use "Dr. Who" as the default user in JobClient.
- A valid user name is required. (Tsz Wo (Nicholas), SZE via rangadi)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3128">HADOOP-3128</a>. Throw RemoteException in setPermissions and setOwner of
- DistributedFileSystem.<br />(shv via nigel)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.16.1_-_2008-03-13_')">Release 0.16.1 - 2008-03-13
- </a></h3>
- <ul id="release_0.16.1_-_2008-03-13_">
- <li><a href="javascript:toggleList('release_0.16.1_-_2008-03-13_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (1)
- <ol id="release_0.16.1_-_2008-03-13_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2869">HADOOP-2869</a>. Deprecate SequenceFile.setCompressionType in favor of
- SequenceFile.createWriter, SequenceFileOutputFormat.setCompressionType,
- and JobConf.setMapOutputCompressionType. (Arun C Murthy via cdouglas)
- Configuration changes to hadoop-default.xml:
- deprecated io.seqfile.compression.type
- </li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.16.1_-_2008-03-13_._improvements_')"> IMPROVEMENTS
- </a> (2)
- <ol id="release_0.16.1_-_2008-03-13_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2371">HADOOP-2371</a>. User guide for file permissions in HDFS.<br />(Robert Chansler via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3098">HADOOP-3098</a>. Allow more characters in user and group names while
- using -chown and -chgrp commands.<br />(rangadi)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.16.1_-_2008-03-13_._bug_fixes_')"> BUG FIXES
- </a> (31)
- <ol id="release_0.16.1_-_2008-03-13_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2789">HADOOP-2789</a>. Race condition in IPC Server Responder that could close
- connections early.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2785">HADOOP-2785</a>. minor. Fix a typo in Datanode block verification<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2788">HADOOP-2788</a>. minor. Fix help message for chgrp shell command (Raghu Angadi).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1188">HADOOP-1188</a>. fstime file is updated when a storage directory containing
- namespace image becomes inaccessible.<br />(shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2787">HADOOP-2787</a>. An application can set a configuration variable named
- dfs.umask to set the umask that is used by DFS.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2780">HADOOP-2780</a>. The default socket buffer size for DataNodes is 128K.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2716">HADOOP-2716</a>. Superuser privileges for the Balancer.
- (Tsz Wo (Nicholas), SZE via shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2754">HADOOP-2754</a>. Filter out .crc files from local file system listing.<br />(Hairong Kuang via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2733">HADOOP-2733</a>. Fix compiler warnings in test code.
- (Tsz Wo (Nicholas), SZE via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2725">HADOOP-2725</a>. Modify distcp to avoid leaving partially copied files at
- the destination after encountering an error. (Tsz Wo (Nicholas), SZE
- via cdouglas)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2391">HADOOP-2391</a>. Cleanup job output directory before declaring a job as
- SUCCESSFUL.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2808">HADOOP-2808</a>. Minor fix to FileUtil::copy to mind the overwrite
- formal.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2683">HADOOP-2683</a>. Moving UGI out of the RPC Server.
- (Tsz Wo (Nicholas), SZE via shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2814">HADOOP-2814</a>. Fix for NPE in datanode in unit test TestDataTransferProtocol.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2811">HADOOP-2811</a>. Dump of counters in job history does not add comma between
- groups.<br />(runping via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2735">HADOOP-2735</a>. Enables setting TMPDIR for tasks.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2843">HADOOP-2843</a>. Fix protections on map-side join classes to enable derivation.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2840">HADOOP-2840</a>. Fix gridmix scripts to correctly invoke the java sort through
- the proper jar.<br />(Mukund Madhugiri via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2769">HADOOP-2769</a>. TestNNThroughputBenchmark should not use a fixed port for
- the namenode http port.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2852">HADOOP-2852</a>. Update gridmix benchmark to avoid an artificially long tail.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2894">HADOOP-2894</a>. Fix a problem to do with tasktrackers failing to connect to
- JobTracker upon reinitialization. (Owen O'Malley via ddas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2903">HADOOP-2903</a>. Fix exception generated by Metrics while using pushMetric().<br />(girish vaitheeswaran via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2904">HADOOP-2904</a>. Fix to RPC metrics to log the correct host name.<br />(girish vaitheeswaran via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2918">HADOOP-2918</a>. Improve error logging so that dfs writes failure with
- "No lease on file" can be diagnosed.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2923">HADOOP-2923</a>. Add SequenceFileAsBinaryInputFormat, which was
- missed in the commit for <a href="http://issues.apache.org/jira/browse/HADOOP-2603">HADOOP-2603</a>.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2931">HADOOP-2931</a>. IOException thrown by DFSOutputStream had wrong stack
- trace in some cases.<br />(Michael Bieniosek via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2883">HADOOP-2883</a>. Write failures and data corruptions on HDFS files.
- The write timeout is back to what it was on 0.15 release. Also, the
- datanode flushes the block file buffered output stream before
- sending a positive ack for the packet back to the client.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2756">HADOOP-2756</a>. NPE in DFSClient while closing DFSOutputStreams
- under load.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2958">HADOOP-2958</a>. Fixed FileBench which broke due to <a href="http://issues.apache.org/jira/browse/HADOOP-2391">HADOOP-2391</a> which performs
- a check for existence of the output directory and a trivial bug in
- GenericMRLoadGenerator where min/max word lengths were identical since
- they were looking at the same config variables<br />(Chris Douglas via
- acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2915">HADOOP-2915</a>. Fixed FileSystem.CACHE so that a username is included
- in the cache key. (Tsz Wo (Nicholas), SZE via nigel)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2813">HADOOP-2813</a>. TestDU unit test uses its own directory to run its
- sequence of tests.<br />(Mahadev Konar via dhruba)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.16.0_-_2008-02-07_')">Release 0.16.0 - 2008-02-07
- </a></h3>
- <ul id="release_0.16.0_-_2008-02-07_">
- <li><a href="javascript:toggleList('release_0.16.0_-_2008-02-07_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (14)
- <ol id="release_0.16.0_-_2008-02-07_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1245">HADOOP-1245</a>. Use the mapred.tasktracker.tasks.maximum value
- configured on each tasktracker when allocating tasks, instead of
- the value configured on the jobtracker. InterTrackerProtocol
- version changed from 5 to 6.<br />(Michael Bieniosek via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1843">HADOOP-1843</a>. Removed code from Configuration and JobConf deprecated by
- <a href="http://issues.apache.org/jira/browse/HADOOP-785">HADOOP-785</a> and a minor fix to Configuration.toString. Specifically the
- important change is that mapred-default.xml is no longer supported and
- Configuration no longer supports the notion of default/final resources.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1302">HADOOP-1302</a>. Remove deprecated abacus code from the contrib directory.
- This also fixes a configuration bug in AggregateWordCount, so that the
- job now works.<br />(enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2288">HADOOP-2288</a>. Enhance FileSystem API to support access control.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2184">HADOOP-2184</a>. RPC Support for user permissions and authentication.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2185">HADOOP-2185</a>. RPC Server uses any available port if the specified
- port is zero. Otherwise it uses the specified port. Also combines
- the configuration attributes for the servers' bind address and
- port from "x.x.x.x" and "y" to "x.x.x.x:y".
- Deprecated configuration variables:
- dfs.info.bindAddress
- dfs.info.port
- dfs.datanode.bindAddress
- dfs.datanode.port
- dfs.datanode.info.bindAddress
- dfs.datanode.info.port
- dfs.secondary.info.bindAddress
- dfs.secondary.info.port
- mapred.job.tracker.info.bindAddress
- mapred.job.tracker.info.port
- mapred.task.tracker.report.bindAddress
- tasktracker.http.bindAddress
- tasktracker.http.port
- New configuration variables (post <a href="http://issues.apache.org/jira/browse/HADOOP-2404">HADOOP-2404</a>):
- dfs.secondary.http.address
- dfs.datanode.address
- dfs.datanode.http.address
- dfs.http.address
- mapred.job.tracker.http.address
- mapred.task.tracker.report.address
- mapred.task.tracker.http.address<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2401">HADOOP-2401</a>. Only the current leaseholder can abandon a block for
- a HDFS file. ClientProtocol version changed from 20 to 21.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2381">HADOOP-2381</a>. Support permission information in FileStatus. Client
- Protocol version changed from 21 to 22.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2110">HADOOP-2110</a>. Block report processing creates fewer transient objects.
- Datanode Protocol version changed from 10 to 11.<br />(Sanjay Radia via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2567">HADOOP-2567</a>. Add FileSystem#getHomeDirectory(), which returns the
- user's home directory in a FileSystem as a fully-qualified path.
- FileSystem#getWorkingDirectory() is also changed to return a
- fully-qualified path, which can break applications that attempt
- to, e.g., pass LocalFileSystem#getWorkingDir().toString() directly
- to java.io methods that accept file names.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2514">HADOOP-2514</a>. Change trash feature to maintain a per-user trash
- directory, named ".Trash" in the user's home directory. The
- "fs.trash.root" parameter is no longer used. Full source paths
- are also no longer reproduced within the trash.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2012">HADOOP-2012</a>. Periodic data verification on Datanodes.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1707">HADOOP-1707</a>. The DFSClient does not use a local disk file to cache
- writes to a HDFS file. Changed Data Transfer Version from 7 to 8.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2652">HADOOP-2652</a>. Fix permission issues for HftpFileSystem. This is an
- incompatible change since distcp may not be able to copy files
- from cluster A (compiled with this patch) to cluster B (compiled
- with previous versions). (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.16.0_-_2008-02-07_._new_features_')"> NEW FEATURES
- </a> (13)
- <ol id="release_0.16.0_-_2008-02-07_._new_features_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1857">HADOOP-1857</a>. Ability to run a script when a task fails to capture stack
- traces.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2299">HADOOP-2299</a>. Definition of a login interface. A simple implementation for
- Unix users and groups.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1652">HADOOP-1652</a>. A utility to balance data among datanodes in a HDFS cluster.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2085">HADOOP-2085</a>. A library to support map-side joins of consistently
- partitioned and sorted data sets.<br />(Chris Douglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2336">HADOOP-2336</a>. Shell commands to modify file permissions.<br />(rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1298">HADOOP-1298</a>. Implement file permissions for HDFS.
- (Tsz Wo (Nicholas) &amp; taton via cutting)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2447">HADOOP-2447</a>. HDFS can be configured to limit the total number of
- objects (inodes and blocks) in the file system.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2487">HADOOP-2487</a>. Added an option to get statuses for all submitted/run jobs.
- This information can be used to develop tools for analysing jobs.<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1873">HADOOP-1873</a>. Implement user permissions for Map/Reduce framework.<br />(Hairong Kuang via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2532">HADOOP-2532</a>. Add to MapFile a getClosest method that returns the key
- that comes just before if the key is not present.<br />(stack via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1883">HADOOP-1883</a>. Add versioning to Record I/O.<br />(Vivek Ratan via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2603">HADOOP-2603</a>. Add SequenceFileAsBinaryInputFormat, which reads
- sequence files as BytesWritable/BytesWritable regardless of the
- key and value types used to write the file.<br />(cdouglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2367">HADOOP-2367</a>. Add ability to profile a subset of map/reduce tasks and fetch
- the result to the local filesystem of the submitting application. Also
- includes a general IntegerRanges extension to Configuration for setting
- positive, ranged parameters.<br />(Owen O'Malley via cdouglas)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.16.0_-_2008-02-07_._improvements_')"> IMPROVEMENTS
- </a> (54)
- <ol id="release_0.16.0_-_2008-02-07_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2045">HADOOP-2045</a>. Change committer list on website to a table, so that
- folks can list their organization, timezone, etc.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2058">HADOOP-2058</a>. Facilitate creating new datanodes dynamically in
- MiniDFSCluster.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1855">HADOOP-1855</a>. fsck verifies block placement policies and reports
- violations.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1604">HADOOP-1604</a>. A system administrator can finalize namenode upgrades
- without running the cluster.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1839">HADOOP-1839</a>. Link-ify the Pending/Running/Complete/Killed grid in
- jobdetails.jsp to help quickly narrow down and see categorized TIPs'
- details via jobtasks.jsp.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1210">HADOOP-1210</a>. Log counters in job history.<br />(Owen O'Malley via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1912">HADOOP-1912</a>. Datanode has two new commands COPY and REPLACE. These are
- needed for supporting data rebalance.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2086">HADOOP-2086</a>. This patch adds the ability to add dependencies to a job
- (run via JobControl) after construction.<br />(Adrian Woodhead via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1185">HADOOP-1185</a>. Support changing the logging level of a server without
- restarting the server. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2134">HADOOP-2134</a>. Remove developer-centric requirements from overview.html and
- keep it end-user focussed, specifically sections related to subversion and
- building Hadoop.<br />(Jim Kellerman via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1989">HADOOP-1989</a>. Support simulated DataNodes. This helps creating large virtual
- clusters for testing purposes.<br />(Sanjay Radia via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1274">HADOOP-1274</a>. Support different number of mappers and reducers per
- TaskTracker to allow administrators to better configure and utilize
- heterogeneous clusters.
- Configuration changes to hadoop-default.xml:
- add mapred.tasktracker.map.tasks.maximum (default value of 2)
- add mapred.tasktracker.reduce.tasks.maximum (default value of 2)
- remove mapred.tasktracker.tasks.maximum (deprecated for 0.16.0)<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2104">HADOOP-2104</a>. Adds a description to the ant targets. This makes the
- output of "ant -projecthelp" sensible.<br />(Chris Douglas via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2127">HADOOP-2127</a>. Added a pipes sort example to benchmark trivial pipes
- application versus trivial java application.<br />(omalley via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2113">HADOOP-2113</a>. A new shell command "dfs -text" to view the contents of
- a gzipped file or a SequenceFile.<br />(Chris Douglas via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2207">HADOOP-2207</a>. Add a "package" target for contrib modules that
- permits each to determine what files are copied into release
- builds.<br />(stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1984">HADOOP-1984</a>. Makes the backoff for failed fetches exponential.
- Earlier, it was a random backoff from an interval.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1327">HADOOP-1327</a>. Include website documentation for streaming.<br />(Rob Weltman
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2000">HADOOP-2000</a>. Rewrite NNBench to measure namenode performance accurately.
- It now uses the map-reduce framework for load generation.<br />(Mukund Madhugiri via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2248">HADOOP-2248</a>. Speeds up the framework w.r.t Counters. Also has API
- updates to the Counters part.<br />(Owen O'Malley via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2326">HADOOP-2326</a>. The initial block report at Datanode startup time has
- a random backoff period.<br />(Sanjay Radia via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2432">HADOOP-2432</a>. HDFS includes the name of the file while throwing
- "File does not exist" exception.<br />(Jim Kellerman via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2457">HADOOP-2457</a>. Added a 'forrest.home' property to the 'docs' target in
- build.xml.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2149">HADOOP-2149</a>. A new benchmark for three name-node operations: file create,
- open, and block report, to evaluate the name-node performance
- for optimizations or new features.<br />(Konstantin Shvachko via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2466">HADOOP-2466</a>. Change FileInputFormat.computeSplitSize to a protected
- non-static method to allow sub-classes to provide alternate
- implementations.<br />(Alejandro Abdelnur via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2425">HADOOP-2425</a>. Change TextOutputFormat to handle Text specifically for better
- performance. Make NullWritable implement Comparable. Make TextOutputFormat
- treat NullWritable like null.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1719">HADOOP-1719</a>. Improves the utilization of shuffle copier threads.<br />(Amar Kamat via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2390">HADOOP-2390</a>. Added documentation for user-controls for intermediate
- map-outputs &amp; final job-outputs and native-hadoop libraries.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1660">HADOOP-1660</a>. Add the cwd of the map/reduce task to the java.library.path
- of the child-jvm to support loading of native libraries distributed via
- the DistributedCache.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2285">HADOOP-2285</a>. Speeds up TextInputFormat. Also includes updates to the
- Text API.<br />(Owen O'Malley via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2233">HADOOP-2233</a>. Adds a generic load generator for modeling MR jobs.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2369">HADOOP-2369</a>. Adds a set of scripts for simulating a mix of user map/reduce
- workloads.<br />(Runping Qi via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2547">HADOOP-2547</a>. Removes use of a 'magic number' in build.xml.<br />(Hrishikesh via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2268">HADOOP-2268</a>. Fix org.apache.hadoop.mapred.jobcontrol classes to use the
- List/Map interfaces rather than concrete ArrayList/HashMap classes
- internally.<br />(Adrian Woodhead via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2406">HADOOP-2406</a>. Add a benchmark for measuring read/write performance through
- the InputFormat interface, particularly with compression.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2131">HADOOP-2131</a>. Allow finer-grained control over speculative-execution. Now
- users can set it for maps and reduces independently.
- Configuration changes to hadoop-default.xml:
- deprecated mapred.speculative.execution
- add mapred.map.tasks.speculative.execution
- add mapred.reduce.tasks.speculative.execution<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1965">HADOOP-1965</a>. Interleave sort/spill in the map-task along with calls to the
- Mapper.map method. This is done by splitting the 'io.sort.mb' buffer into
- two and using one half for collecting map-outputs and the other half for
- sort/spill.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2464">HADOOP-2464</a>. Unit tests for chmod, chown, and chgrp using DFS.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1876">HADOOP-1876</a>. Persist statuses of completed jobs in HDFS so that the
- JobClient can query and get information about decommissioned jobs and also
- across JobTracker restarts.
- Configuration changes to hadoop-default.xml:
- add mapred.job.tracker.persist.jobstatus.active (default value of false)
- add mapred.job.tracker.persist.jobstatus.hours (default value of 0)
- add mapred.job.tracker.persist.jobstatus.dir (default value of
- /jobtracker/jobsInfo)<br />(Alejandro Abdelnur via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2077">HADOOP-2077</a>. Added version and build information to STARTUP_MSG for all
- hadoop daemons to aid error-reporting, debugging etc.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2398">HADOOP-2398</a>. Additional instrumentation for NameNode and RPC server.
- Add support for accessing instrumentation statistics via JMX.<br />(Sanjay Radia via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2449">HADOOP-2449</a>. A return of the non-MR version of NNBench.<br />(Sanjay Radia via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1989">HADOOP-1989</a>. Remove 'datanodecluster' command from bin/hadoop.<br />(Sanjay Radia via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1742">HADOOP-1742</a>. Improve JavaDoc documentation for ClientProtocol, DFSClient,
- and FSNamesystem.<br />(Konstantin Shvachko)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2298">HADOOP-2298</a>. Add Ant target for a binary-only distribution.<br />(Hrishikesh via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2509">HADOOP-2509</a>. Add Ant target for Rat report (Apache license header
- reports).<br />(Hrishikesh via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2469">HADOOP-2469</a>. WritableUtils.clone should take a Configuration
- instead of a JobConf.<br />(stack via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2659">HADOOP-2659</a>. Introduce superuser permissions for admin operations.
- (Tsz Wo (Nicholas), SZE via shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2596">HADOOP-2596</a>. Added a SequenceFile.createWriter api which allows the user
- to specify the blocksize, replication factor and the buffersize to be
- used for the underlying HDFS file.<br />(Alejandro Abdelnur via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2431">HADOOP-2431</a>. Test HDFS File Permissions.<br />(Hairong Kuang via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2232">HADOOP-2232</a>. Add an option to disable Nagle's algorithm in the IPC stack.<br />(Clint Morgan via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2342">HADOOP-2342</a>. Created a micro-benchmark for measuring
- local-file versus hdfs reads.<br />(Owen O'Malley via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2529">HADOOP-2529</a>. First version of HDFS User Guide.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2690">HADOOP-2690</a>. Add jar-test target to build.xml, separating compilation
- and packaging of the test classes.<br />(Enis Soztutar via cdouglas)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.16.0_-_2008-02-07_._optimizations_')"> OPTIMIZATIONS
- </a> (4)
- <ol id="release_0.16.0_-_2008-02-07_._optimizations_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1898">HADOOP-1898</a>. Release the lock protecting the last time of the last stack
- dump while the dump is happening.<br />(Amareshwari Sri Ramadasu via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1900">HADOOP-1900</a>. Makes the heartbeat and task event queries interval
- dependent on the cluster size.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2208">HADOOP-2208</a>. Counter update frequency (from TaskTracker to JobTracker) is
- capped at 1 minute.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2284">HADOOP-2284</a>. Reduce the number of progress updates during the sorting in
- the map task.<br />(Amar Kamat via ddas)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.16.0_-_2008-02-07_._bug_fixes_')"> BUG FIXES
- </a> (90)
- <ol id="release_0.16.0_-_2008-02-07_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2583">HADOOP-2583</a>. Fixes a bug in the Eclipse plug-in UI to edit locations.
- Plug-in version is now synchronized with Hadoop version.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2100">HADOOP-2100</a>. Remove faulty check for existence of $HADOOP_PID_DIR and let
- 'mkdir -p' check &amp; create it.<br />(Michael Bieniosek via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1642">HADOOP-1642</a>. Ensure jobids generated by LocalJobRunner are unique to
- avoid collisions and hence job-failures.<br />(Doug Cutting via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2096">HADOOP-2096</a>. Close open file-descriptors held by streams while localizing
- job.xml in the JobTracker and while displaying it on the webui in
- jobconf.jsp.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2098">HADOOP-2098</a>. Log start &amp; completion of empty jobs to JobHistory, which
- also ensures that we close the file-descriptor of the job's history log
- opened during job-submission.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2112">HADOOP-2112</a>. Adding back changes to build.xml lost while reverting
- <a href="http://issues.apache.org/jira/browse/HADOOP-1622">HADOOP-1622</a> i.e. http://svn.apache.org/viewvc?view=rev&amp;revision=588771.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2089">HADOOP-2089</a>. Fixes the command line argument handling to handle multiple
- -cacheArchive in Hadoop streaming.<br />(Lohit Vijayarenu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2071">HADOOP-2071</a>. Fix StreamXmlRecordReader to use a BufferedInputStream
- wrapped over the DFSInputStream since mark/reset aren't supported by
- DFSInputStream anymore.<br />(Lohit Vijayarenu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1348">HADOOP-1348</a>. Allow XML comments inside configuration files.<br />(Rajagopal Natarajan and Enis Soztutar via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1952">HADOOP-1952</a>. Improve handling of invalid, user-specified classes while
- configuring streaming jobs such as combiner, input/output formats etc.
- Now invalid options are caught, logged and jobs are failed early.<br />(Lohit
- Vijayarenu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2151">HADOOP-2151</a>. FileSystem.globPaths validates the list of Paths that
- it returns.<br />(Lohit Vijayarenu via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2121">HADOOP-2121</a>. Cleanup DFSOutputStream when the stream encountered errors
- when Datanodes became full.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1130">HADOOP-1130</a>. The FileSystem.closeAll() method closes all existing
- DFSClients.<br />(Chris Douglas via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2204">HADOOP-2204</a>. DFSTestUtil.waitReplication was not waiting for all replicas
- to get created, thus causing unit test failure.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2078">HADOOP-2078</a>. A zero-size file may have no blocks associated with it.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2212">HADOOP-2212</a>. ChecksumFileSystem.getSumBufferSize might throw
- java.lang.ArithmeticException. The fix is to initialize bytesPerChecksum
- to 0.<br />(Michael Bieniosek via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2216">HADOOP-2216</a>. Fix jobtasks.jsp to ensure that it first collects the
- taskids which satisfy the filtering criteria and then use that list to
- print out only the required task-reports, previously it was oblivious to
- the filtering and hence used the wrong index into the array of task-reports.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2272">HADOOP-2272</a>. Fix findbugs target to reflect changes made to the location
- of the streaming jar file by <a href="http://issues.apache.org/jira/browse/HADOOP-2207">HADOOP-2207</a>.<br />(Adrian Woodhead via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2244">HADOOP-2244</a>. Fixes the MapWritable.readFields to clear the instance
- field variable every time readFields is called. (Michael Stack via ddas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2245">HADOOP-2245</a>. Fixes LocalJobRunner to include a jobId in the mapId. Also,
- adds a testcase for JobControl. (Adrian Woodhead via ddas).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2275">HADOOP-2275</a>. Fix erroneous detection of corrupted file when namenode
- fails to allocate any datanodes for newly allocated block.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2256">HADOOP-2256</a>. Fix a bug in the namenode that could cause it to encounter
- an infinite loop while deleting excess replicas that were created by
- block rebalancing.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2209">HADOOP-2209</a>. SecondaryNamenode process exits if it encounters exceptions
- that it cannot handle.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2314">HADOOP-2314</a>. Prevent TestBlockReplacement from occasionally getting
- into an infinite loop.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2300">HADOOP-2300</a>. This fixes a bug where mapred.tasktracker.tasks.maximum
- would be ignored even if it was set in hadoop-site.xml.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2349">HADOOP-2349</a>. Improve code layout in file system transaction logging code.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2368">HADOOP-2368</a>. Fix unit tests on Windows.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2363">HADOOP-2363</a>. This fix allows running multiple instances of the unit test
- in parallel. The bug was introduced in <a href="http://issues.apache.org/jira/browse/HADOOP-2185">HADOOP-2185</a> that changed
- port-rolling behaviour.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2271">HADOOP-2271</a>. Fix chmod task to be non-parallel.<br />(Adrian Woodhead via
- omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2313">HADOOP-2313</a>. Fail the build if building libhdfs fails.<br />(nigel via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2359">HADOOP-2359</a>. Remove warning for interrupted exception when closing down
- minidfs.<br />(dhruba via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1841">HADOOP-1841</a>. Prevent slow clients from consuming threads in the NameNode.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2323">HADOOP-2323</a>. JobTracker.close() should not print stack traces for
- normal exit.<br />(jimk via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2376">HADOOP-2376</a>. Prevents sort example from overriding the number of maps.<br />(Owen O'Malley via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2434">HADOOP-2434</a>. FSDatasetInterface read interface causes HDFS reads to occur
- in 1 byte chunks, causing performance degradation.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2459">HADOOP-2459</a>. Fix package target so that src/docs/build files are not
- included in the release.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2215">HADOOP-2215</a>. Fix documentation in cluster_setup.html &amp;
- mapred_tutorial.html to reflect that mapred.tasktracker.tasks.maximum has
- been superseded by mapred.tasktracker.{map|reduce}.tasks.maximum.<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2459">HADOOP-2459</a>. Fix package target so that src/docs/build files are not
- included in the release.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2352">HADOOP-2352</a>. Remove AC_CHECK_LIB for libz and liblzo to ensure that
- libhadoop.so doesn't have a dependency on them.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2453">HADOOP-2453</a>. Fix the configuration for wordcount-simple example in Hadoop
- Pipes which currently produces an XML parsing error.<br />(Amareshwari Sri
- Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2476">HADOOP-2476</a>. Unit test failure while reading permission bits of local
- file system (on Windows) fixed.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2247">HADOOP-2247</a>. Fine-tune the strategies for killing mappers and reducers
- due to failures while fetching map-outputs. Now the map-completion times
- and number of currently running reduces are taken into account by the
- JobTracker before killing the mappers, while the progress made by the
- reducer and the number of fetch-failures vis-a-vis total number of
- fetch-attempts are taken into account before the reducer kills itself.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2452">HADOOP-2452</a>. Fix eclipse plug-in build.xml to refer to the right
- location where hadoop-*-core.jar is generated.<br />(taton)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2492">HADOOP-2492</a>. Additional debugging in the rpc server to better
- diagnose ConcurrentModificationException.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2344">HADOOP-2344</a>. Enhance the utility for executing shell commands to read the
- stdout/stderr streams while waiting for the command to finish (to free up
- the buffers). Also, this patch throws away stderr of the DF utility.
- @deprecated
- org.apache.hadoop.fs.ShellCommand for org.apache.hadoop.util.Shell
- org.apache.hadoop.util.ShellUtil for
- org.apache.hadoop.util.Shell.ShellCommandExecutor<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2511">HADOOP-2511</a>. Fix a javadoc warning in org.apache.hadoop.util.Shell
- introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-2344">HADOOP-2344</a>.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2442">HADOOP-2442</a>. Fix TestLocalFileSystemPermission.testLocalFSsetOwner
- to work on more platforms.<br />(Raghu Angadi via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2488">HADOOP-2488</a>. Fix a regression in random read performance.<br />(Michael Stack via rangadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2523">HADOOP-2523</a>. Fix TestDFSShell.testFilePermissions on Windows.<br />(Raghu Angadi via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2535">HADOOP-2535</a>. Removed support for deprecated mapred.child.heap.size and
- fixed some indentation issues in TaskRunner. (acmurthy)
- Configuration changes to hadoop-default.xml:
- remove mapred.child.heap.size
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2512">HADOOP-2512</a>. Fix error stream handling in Shell. Use exit code to
- detect shell command errors in RawLocalFileSystem.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2446">HADOOP-2446</a>. Fixes TestHDFSServerPorts and TestMRServerPorts so they
- do not rely on statically configured ports and cleanup better.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2537">HADOOP-2537</a>. Make build process compatible with Ant 1.7.0.<br />(Hrishikesh via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1281">HADOOP-1281</a>. Ensure running tasks of completed map TIPs (e.g. speculative
- tasks) are killed as soon as the TIP completed.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2571">HADOOP-2571</a>. Suppress a spurious warning in test code.<br />(cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2481">HADOOP-2481</a>. NNBench reports its progress periodically.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2601">HADOOP-2601</a>. Start name-node on a free port for TestNNThroughputBenchmark.<br />(Konstantin Shvachko)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2494">HADOOP-2494</a>. Set +x on contrib/*/bin/* in packaged tar bundle.<br />(stack via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2605">HADOOP-2605</a>. Remove bogus leading slash in task-tracker report bindAddress.<br />(Konstantin Shvachko)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2620">HADOOP-2620</a>. Trivial. 'bin/hadoop fs -help' did not list chmod, chown, and
- chgrp.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2614">HADOOP-2614</a>. The DFS WebUI accesses are configured to be from the user
- specified by dfs.web.ugi. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2543">HADOOP-2543</a>. Implement a "no-permission-checking" mode for smooth
- upgrade from a pre-0.16 install of HDFS.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-290">HADOOP-290</a>. A DataNode log message now prints the target of a replication
- request correctly.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2538">HADOOP-2538</a>. Redirect to a warning, if plaintext parameter is true but
- the filter parameter is not given in TaskLogServlet.<br />(Michael Bieniosek via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2582">HADOOP-2582</a>. Prevent 'bin/hadoop fs -copyToLocal' from creating
- zero-length files when the src does not exist.<br />(Lohit Vijayarenu via cdouglas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2189">HADOOP-2189</a>. Incrementing user counters should count as progress.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2649">HADOOP-2649</a>. The NameNode periodically computes replication work for
- the datanodes. The periodicity of this computation is now configurable.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2549">HADOOP-2549</a>. Correct disk size computation so that data-nodes could switch
- to other local drives if current is full.<br />(Hairong Kuang via shv)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2633">HADOOP-2633</a>. Fsck should call name-node methods directly rather than
- through rpc. (Tsz Wo (Nicholas), SZE via shv)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2687">HADOOP-2687</a>. Modify a few log messages generated by dfs client to be
- logged only at INFO level.<br />(stack via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2402">HADOOP-2402</a>. Fix BlockCompressorStream to ensure it buffers data before
- sending it down to the compressor so that each write call doesn't
- compress.<br />(Chris Douglas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2645">HADOOP-2645</a>. The Metrics initialization code does not throw
- exceptions when servers are restarted by MiniDFSCluster.<br />(Sanjay Radia via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2691">HADOOP-2691</a>. Fix a race condition that was causing the DFSClient
- to erroneously remove a good datanode from a pipeline that actually
- had another datanode that was bad.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1195">HADOOP-1195</a>. All code in FSNamesystem checks the return value
- of getDataNode for null before using it.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2640">HADOOP-2640</a>. Fix a bug in MultiFileSplitInputFormat that was always
- returning 1 split in some circumstances.<br />(Enis Soztutar via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2626">HADOOP-2626</a>. Fix paths with special characters to work correctly
- with the local filesystem.<br />(Thomas Friol via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2646">HADOOP-2646</a>. Fix SortValidator to work with fully-qualified
- working directories.<br />(Arun C Murthy via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2092">HADOOP-2092</a>. Added a ping mechanism to the pipes' task to periodically
- check if the parent Java task is running, and exit if the parent isn't
- alive and responding.<br />(Amareshwari Sri Ramadasu via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2714">HADOOP-2714</a>. TestDecommission failed on windows because the replication
- request was timing out.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2576">HADOOP-2576</a>. Namenode performance degradation over time triggered by
- large heartbeat interval.<br />(Raghu Angadi)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2713">HADOOP-2713</a>. TestDatanodeDeath failed on windows because the replication
- request was timing out.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2639">HADOOP-2639</a>. Fixes a problem to do with incorrect maintenance of values
- for runningMapTasks/runningReduceTasks.<br />(Amar Kamat and Arun Murthy
- via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2723">HADOOP-2723</a>. Fixed the check for checking whether to do user task
- profiling.<br />(Amareshwari Sri Ramadasu via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2734">HADOOP-2734</a>. Link forrest docs to new http://hadoop.apache.org<br />(Doug Cutting via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2641">HADOOP-2641</a>. Added Apache license headers to 95 files.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2732">HADOOP-2732</a>. Fix bug in path globbing.<br />(Hairong Kuang via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2404">HADOOP-2404</a>. Fix backwards compatibility with hadoop-0.15 configuration
- files that was broken by <a href="http://issues.apache.org/jira/browse/HADOOP-2185">HADOOP-2185</a>.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2755">HADOOP-2755</a>. Fix fsck performance degradation because of permissions
- issue. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2768">HADOOP-2768</a>. Fix performance regression caused by <a href="http://issues.apache.org/jira/browse/HADOOP-1707">HADOOP-1707</a>.<br />(dhruba borthakur via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-3108">HADOOP-3108</a>. Fix NPE in setPermission and setOwner.<br />(shv)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.15.3_-_2008-01-18_')">Release 0.15.3 - 2008-01-18
- </a></h3>
- <ul id="release_0.15.3_-_2008-01-18_">
- <li><a href="javascript:toggleList('release_0.15.3_-_2008-01-18_._bug_fixes_')"> BUG FIXES
- </a> (4)
- <ol id="release_0.15.3_-_2008-01-18_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2562">HADOOP-2562</a>. globPaths supports {ab,cd}.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2540">HADOOP-2540</a>. fsck reports missing blocks incorrectly.<br />(dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2570">HADOOP-2570</a>. "work" directory created unconditionally, and symlinks
- created from the task cwds.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2574">HADOOP-2574</a>. Fixed mapred_tutorial.xml to correct minor errors with the
- WordCount examples.<br />(acmurthy)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.15.2_-_2008-01-02_')">Release 0.15.2 - 2008-01-02
- </a></h3>
- <ul id="release_0.15.2_-_2008-01-02_">
- <li><a href="javascript:toggleList('release_0.15.2_-_2008-01-02_._bug_fixes_')"> BUG FIXES
- </a> (11)
- <ol id="release_0.15.2_-_2008-01-02_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2246">HADOOP-2246</a>. Moved the changelog for <a href="http://issues.apache.org/jira/browse/HADOOP-1851">HADOOP-1851</a> from the NEW FEATURES
- section to the INCOMPATIBLE CHANGES section.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2238">HADOOP-2238</a>. Fix TaskGraphServlet so that it sets the content type of
- the response appropriately.<br />(Paul Saab via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2129">HADOOP-2129</a>. Fix so that distcp works correctly when source is
- HDFS but not the default filesystem. HDFS paths returned by the
- listStatus() method are now fully-qualified.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2378">HADOOP-2378</a>. Fixes a problem where the last task completion event would
- get created after the job completes.<br />(Alejandro Abdelnur via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2228">HADOOP-2228</a>. Checks whether a job with a certain jobId is already running
- and then tries to create the JobInProgress object.<br />(Johan Oskarsson via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2422">HADOOP-2422</a>. dfs -cat multiple files fail with 'Unable to write to
- output stream'.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2460">HADOOP-2460</a>. When the namenode encounters ioerrors on writing a
- transaction log, it stops writing new transactions to that one.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2227">HADOOP-2227</a>. Use the LocalDirAllocator uniformly for handling all of the
- temporary storage required for a given task. It also implies that
- mapred.local.dir.minspacestart is handled by checking if there is enough
- free-space on any one of the available disks.<br />(Amareshwari Sri Ramadasu
- via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2437">HADOOP-2437</a>. Fix the LocalDirAllocator to choose the seed for the
- round-robin disk selections randomly. This helps in spreading data across
- multiple partitions much better.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2486">HADOOP-2486</a>. When the list of files from the InMemoryFileSystem is obtained
- for merging, this patch will ensure that only those files whose checksums
- have also got created (renamed) are returned.<br />(ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2456">HADOOP-2456</a>. Hardcode English locale to prevent NumberFormatException
- from occurring when starting the NameNode with certain locales.<br />(Matthias Friedrich via nigel)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.2_-_2008-01-02_._improvements_')"> IMPROVEMENTS
- </a> (4)
- <ol id="release_0.15.2_-_2008-01-02_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2160">HADOOP-2160</a>. Remove project-level, non-user documentation from
- releases, since it's now maintained in a separate tree.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1327">HADOOP-1327</a>. Add user documentation for streaming.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2382">HADOOP-2382</a>. Add hadoop-default.html to subversion.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2158">HADOOP-2158</a>. hdfsListDirectory calls FileSystem.listStatus instead
- of FileSystem.listPaths. This reduces the number of RPC calls on the
- namenode, thereby improving scalability.<br />(Christian Kunz via dhruba)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.15.1_-_2007-11-27_')">Release 0.15.1 - 2007-11-27
- </a></h3>
- <ul id="release_0.15.1_-_2007-11-27_">
- <li><a href="javascript:toggleList('release_0.15.1_-_2007-11-27_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (1)
- <ol id="release_0.15.1_-_2007-11-27_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-713">HADOOP-713</a>. Reduce CPU usage on namenode while listing directories.
- FileSystem.listPaths does not return the size of the entire subtree.
- Introduced a new API ClientProtocol.getContentLength that returns the
- size of the subtree.<br />(Dhruba Borthakur via dhruba)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.1_-_2007-11-27_._improvements_')"> IMPROVEMENTS
- </a> (1)
- <ol id="release_0.15.1_-_2007-11-27_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1917">HADOOP-1917</a>. Addition of guides/tutorial for better overall
- documentation for Hadoop. Specifically:
- * quickstart.html is targeted towards first-time users and helps them
- set up a single-node cluster and play with Hadoop.
- * cluster_setup.html helps admins to configure and set up non-trivial
- hadoop clusters.
- * mapred_tutorial.html is a comprehensive Map-Reduce tutorial.<br />(acmurthy)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.1_-_2007-11-27_._bug_fixes_')"> BUG FIXES
- </a> (3)
- <ol id="release_0.15.1_-_2007-11-27_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2174">HADOOP-2174</a>. Removed the unnecessary Reporter.setStatus call from
- FSCopyFilesMapper.close which led to a NPE since the reporter isn't valid
- in the close method.<br />(Chris Douglas via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2172">HADOOP-2172</a>. Restore performance of random access to local files
- by caching positions of local input streams, avoiding a system
- call.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2205">HADOOP-2205</a>. Regenerate the Hadoop website since some of the changes made
- by <a href="http://issues.apache.org/jira/browse/HADOOP-1917">HADOOP-1917</a> weren't correctly copied over to the trunk/docs directory.
- Also fixed a couple of minor typos and broken links.<br />(acmurthy)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.15.0_-_2007-11-2_')">Release 0.15.0 - 2007-11-2
- </a></h3>
- <ul id="release_0.15.0_-_2007-11-2_">
- <li><a href="javascript:toggleList('release_0.15.0_-_2007-11-2_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (10)
- <ol id="release_0.15.0_-_2007-11-2_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1708">HADOOP-1708</a>. Make files appear in namespace as soon as they are
- created.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-999">HADOOP-999</a>. A HDFS Client immediately informs the NameNode of a new
- file creation. ClientProtocol version changed from 14 to 15.
- (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-932">HADOOP-932</a>. File locking interfaces and implementations (that were
- earlier deprecated) are removed. Client Protocol version changed
- from 15 to 16.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1621">HADOOP-1621</a>. FileStatus is now a concrete class and FileSystem.listPaths
- is deprecated and replaced with listStatus.<br />(Chris Douglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1656">HADOOP-1656</a>. The blockSize of a file is stored persistently in the file
- inode.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1838">HADOOP-1838</a>. The blocksize of files created with an earlier release is
- set to the default block size.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-785">HADOOP-785</a>. Add support for 'final' Configuration parameters,
- removing support for 'mapred-default.xml', and changing
- 'hadoop-site.xml' to not override other files. Now folks should
- generally use 'hadoop-site.xml' for all configurations. Values
- with a 'final' tag may not be overridden by subsequently loaded
- configuration files, e.g., by jobs.<br />(Arun C. Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1846">HADOOP-1846</a>. DatanodeReport in ClientProtocol can report live
- datanodes, dead datanodes or all datanodes. Client Protocol version
- changed from 17 to 18.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1851">HADOOP-1851</a>. Permit specification of map output compression type
- and codec, independent of the final output's compression
- parameters.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1819">HADOOP-1819</a>. Jobtracker cleanups, including binding ports before
- clearing state directories, so that inadvertently starting a
- second jobtracker doesn't trash one that's already running. Removed
- method JobTracker.getTracker() because the static variable, which
- stored the value caused initialization problems.<br />(omalley via cutting)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.0_-_2007-11-2_._new_features_')"> NEW FEATURES
- </a> (14)
- <ol id="release_0.15.0_-_2007-11-2_._new_features_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-89">HADOOP-89</a>. A client can access file data even before the creator
- has closed the file. Introduce a new command "tail" from dfs shell.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1636">HADOOP-1636</a>. Allow configuration of the number of jobs kept in
- memory by the JobTracker.<br />(Michael Bieniosek via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1667">HADOOP-1667</a>. Reorganize CHANGES.txt into sections to make it
- easier to read. Also remove numbering, to make merging easier.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1610">HADOOP-1610</a>. Add metrics for failed tasks.<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1767">HADOOP-1767</a>. Add "bin/hadoop job -list" sub-command.<br />(taton via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1351">HADOOP-1351</a>. Add "bin/hadoop job [-fail-task|-kill-task]" sub-commands
- to terminate a particular task-attempt.<br />(Enis Soztutar via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1880">HADOOP-1880</a>. SleepJob : An example job that sleeps at each map and
- reduce task.<br />(enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1809">HADOOP-1809</a>. Add a link in web site to #hadoop IRC channel.<br />(enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1894">HADOOP-1894</a>. Add percentage graphs and mapred task completion graphs
- to Web User Interface. Users not using Firefox may install a plugin to
- their browsers to see svg graphics.<br />(enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1914">HADOOP-1914</a>. Introduce a new NamenodeProtocol to allow secondary
- namenodes and rebalancing processes to communicate with a primary
- namenode.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1963">HADOOP-1963</a>. Add a FileSystem implementation for the Kosmos
- Filesystem (KFS).<br />(Sriram Rao via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1822">HADOOP-1822</a>. Allow the specialization and configuration of socket
- factories. Provide a StandardSocketFactory, and a SocksSocketFactory to
- allow the use of SOCKS proxies. (taton).
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1968">HADOOP-1968</a>. FileSystem supports wildcard input syntax "{ }".<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2566">HADOOP-2566</a>. Add globStatus method to the FileSystem interface
- and deprecate globPath and listPath.<br />(Hairong Kuang via hairong)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.0_-_2007-11-2_._optimizations_')"> OPTIMIZATIONS
- </a> (8)
- <ol id="release_0.15.0_-_2007-11-2_._optimizations_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1910">HADOOP-1910</a>. Reduce the number of RPCs that DistributedFileSystem.create()
- makes to the namenode.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1565">HADOOP-1565</a>. Reduce memory usage of NameNode by replacing
- TreeMap in HDFS Namespace with ArrayList.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1743">HADOOP-1743</a>. Change DFS INode from a nested class to standalone
- class, with specialized subclasses for directories and files, to
- save memory on the namenode.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1759">HADOOP-1759</a>. Change file name in INode from String to byte[],
- saving memory on the namenode.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1766">HADOOP-1766</a>. Save memory in namenode by having BlockInfo extend
- Block, and replace many uses of Block with BlockInfo.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1687">HADOOP-1687</a>. Save memory in namenode by optimizing BlockMap
- representation.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1774">HADOOP-1774</a>. Remove use of INode.parent in Block CRC upgrade.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1788">HADOOP-1788</a>. Increase the buffer size on the Pipes command socket.<br />(Amareshwari Sri Ramadasu and Christian Kunz via omalley)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.0_-_2007-11-2_._bug_fixes_')"> BUG FIXES
- </a> (64)
- <ol id="release_0.15.0_-_2007-11-2_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1946">HADOOP-1946</a>. The Datanode code does not need to invoke du on
- every heartbeat.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1935">HADOOP-1935</a>. Fix a NullPointerException in internalReleaseCreate.<br />(Dhruba Borthakur)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1933">HADOOP-1933</a>. The nodes listed in include and exclude files
- are always listed in the datanode report.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1953">HADOOP-1953</a>. The job tracker should wait between calls to try and delete
- the system directory<br />(Owen O'Malley via devaraj)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1932">HADOOP-1932</a>. TestFileCreation fails with message saying filestatus.dat
- is of incorrect size.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1573">HADOOP-1573</a>. Support for 0 reducers in PIPES.<br />(Owen O'Malley via devaraj)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1500">HADOOP-1500</a>. Fix typographical errors in the DFS WebUI.<br />(Nigel Daley via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1076">HADOOP-1076</a>. Periodic checkpoint can continue even if an earlier
- checkpoint encountered an error.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1887">HADOOP-1887</a>. The Namenode encounters an ArrayIndexOutOfBoundsException
- while listing a directory that had a file that was
- being actively written to.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1904">HADOOP-1904</a>. The Namenode encounters an exception because the
- list of blocks per datanode-descriptor was corrupted.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1762">HADOOP-1762</a>. The Namenode fsimage does not contain a list of
- Datanodes.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1890">HADOOP-1890</a>. Removed debugging prints introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-1774">HADOOP-1774</a>.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1763">HADOOP-1763</a>. Too many lost task trackers on large clusters due to
- insufficient number of RPC handler threads on the JobTracker.<br />(Devaraj Das)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1463">HADOOP-1463</a>. HDFS reports correct usage statistics for disk space
- used by HDFS.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1692">HADOOP-1692</a>. In DFS ant task, don't cache the Configuration.<br />(Chris Douglas via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1726">HADOOP-1726</a>. Remove lib/jetty-ext/ant.jar.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1772">HADOOP-1772</a>. Fix hadoop-daemon.sh script to get correct hostname
- under Cygwin. (Tsz Wo (Nicholas), SZE via cutting)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1749">HADOOP-1749</a>. Change TestDFSUpgrade to sort files, fixing sporadic
- test failures.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1748">HADOOP-1748</a>. Fix tasktracker to be able to launch tasks when log
- directory is relative.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1775">HADOOP-1775</a>. Fix a NullPointerException and an
- IllegalArgumentException in MapWritable.<br />(Jim Kellerman via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1795">HADOOP-1795</a>. Fix so that jobs can generate output file names with
- special characters.<br />(Fr&#233;d&#233;ric Bertin via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1810">HADOOP-1810</a>. Fix incorrect value type in MRBench (SmallJobs)<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1806">HADOOP-1806</a>. Fix ant task to compile again, also fix default
- builds to compile ant tasks.<br />(Chris Douglas via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1758">HADOOP-1758</a>. Fix escape processing in librecordio to not be
- quadratic.<br />(Vivek Ratan via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1817">HADOOP-1817</a>. Fix MultiFileSplit to read and write the split
- length, so that it is not always zero in map tasks.<br />(Thomas Friol via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1853">HADOOP-1853</a>. Fix contrib/streaming to accept multiple -cacheFile
- options.<br />(Prachi Gupta via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1818">HADOOP-1818</a>. Fix MultiFileInputFormat so that it does not return
- empty splits when numPaths &lt; numSplits.<br />(Thomas Friol via enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1840">HADOOP-1840</a>. Fix race condition which leads to task's diagnostic
- messages getting lost.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1885">HADOOP-1885</a>. Fix race condition in MiniDFSCluster shutdown.<br />(Chris Douglas via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1889">HADOOP-1889</a>. Fix path in EC2 scripts for building your own AMI.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1892">HADOOP-1892</a>. Fix a NullPointerException in the JobTracker when
- trying to fetch a task's diagnostic messages from the JobClient.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1897">HADOOP-1897</a>. Completely remove about.html page from the web site.<br />(enis)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1907">HADOOP-1907</a>. Fix null pointer exception when getting task diagnostics
- in JobClient.<br />(Christian Kunz via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1882">HADOOP-1882</a>. Remove spurious asterisks from decimal number displays.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1783">HADOOP-1783</a>. Make S3 FileSystem return Paths fully-qualified with
- scheme and host.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1925">HADOOP-1925</a>. Make pipes' autoconf script look for libsocket and libnsl, so
- that it can compile under Solaris.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1940">HADOOP-1940</a>. TestDFSUpgradeFromImage must shut down its MiniDFSCluster.<br />(Chris Douglas via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1930">HADOOP-1930</a>. Fix the blame for failed fetches on the right host.<br />(Arun C.
- Murthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1934">HADOOP-1934</a>. Fix the platform name on Mac to use underscores rather than
- spaces.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1959">HADOOP-1959</a>. Use "/" instead of File.separator in the StatusHttpServer.<br />(jimk via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1626">HADOOP-1626</a>. Improve dfsadmin help messages.<br />(Lohit Vijayarenu via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1695">HADOOP-1695</a>. The SecondaryNamenode waits for the Primary NameNode to
- start up.<br />(Dhruba Borthakur)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1983">HADOOP-1983</a>. Have Pipes flush the command socket when progress is sent
- to prevent timeouts during long computations.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1875">HADOOP-1875</a>. Non-existent directories or read-only directories are
- filtered from dfs.client.buffer.dir.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1992">HADOOP-1992</a>. Fix the performance degradation in the sort validator.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1874">HADOOP-1874</a>. Move task-outputs' promotion/discard to a separate thread
- distinct from the main heartbeat-processing thread. The main upside being
- that we do not lock-up the JobTracker during HDFS operations, which
- otherwise may lead to lost tasktrackers if the NameNode is unresponsive.<br />(Devaraj Das via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2026">HADOOP-2026</a>. Namenode prints out one log line for "Number of transactions"
- at most once every minute.<br />(Dhruba Borthakur)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2022">HADOOP-2022</a>. Ensure that status information for successful tasks is correctly
- recorded at the JobTracker, so that, for example, one may view correct
- information via taskdetails.jsp. This bug was introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-1874">HADOOP-1874</a>.<br />(Amar Kamat via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2031">HADOOP-2031</a>. Correctly maintain the taskid which takes the TIP to
- completion, failing which the case of lost tasktrackers isn't handled
- properly i.e. the map TIP is incorrectly left marked as 'complete' and it
- is never rescheduled elsewhere, leading to hung reduces.<br />(Devaraj Das via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2018">HADOOP-2018</a>. The source datanode of a data transfer waits for
- a response from the target datanode before closing the data stream.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2023">HADOOP-2023</a>. Disable TestLocalDirAllocator on Windows.<br />(Hairong Kuang via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2016">HADOOP-2016</a>. Ignore status-updates from FAILED/KILLED tasks at the
- TaskTracker. This fixes a race-condition which caused the tasks to wrongly
- remain in the RUNNING state even after being killed by the JobTracker and
- thus handicap the cleanup of the task's output sub-directory.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1771">HADOOP-1771</a>. Fix a NullPointerException in streaming caused by an
- IOException in MROutputThread.<br />(lohit vijayarenu via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2028">HADOOP-2028</a>. Fix distcp so that the log dir does not need to be
- specified and the destination does not need to exist.<br />(Chris Douglas via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2044">HADOOP-2044</a>. The namenode protects all lease manipulations using a
- sortedLease lock.<br />(Dhruba Borthakur)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2051">HADOOP-2051</a>. The TaskCommit thread should not die for exceptions other
- than the InterruptedException. This behavior is there for the other long
- running threads in the JobTracker.<br />(Arun C Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1973">HADOOP-1973</a>. The FileSystem object would be accessed on the JobTracker
- through a RPC in the InterTrackerProtocol. The check for the object being
- null was missing and hence NPE would be thrown sometimes. This issue fixes
- that problem.<br />(Amareshwari Sri Ramadasu via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2033">HADOOP-2033</a>. The SequenceFile.Writer.sync method was a no-op, which caused
- very uneven splits for applications like distcp that count on them.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2070">HADOOP-2070</a>. Added a flush method to pipes' DownwardProtocol and call
- that before waiting for the application to finish to ensure all buffered
- data is flushed.<br />(Owen O'Malley via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2080">HADOOP-2080</a>. Fixed calculation of the checksum file size when the values
- are large.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2048">HADOOP-2048</a>. Change error handling in distcp so that each map copies
- as much as possible before reporting the error. Also report progress on
- every copy.<br />(Chris Douglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2073">HADOOP-2073</a>. Change size of VERSION file after writing contents to it.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2102">HADOOP-2102</a>. Fix the deprecated ToolBase to pass its Configuration object
- to the superseding ToolRunner to ensure it picks up the appropriate
- configuration resources.<br />(Dennis Kubes and Enis Soztutar via acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2103">HADOOP-2103</a>. Fix minor javadoc bugs introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-2046">HADOOP-2046</a>.<br />(Nigel
- Daley via acmurthy)</li>
- </ol>
- </li>
- <li><a href="javascript:toggleList('release_0.15.0_-_2007-11-2_._improvements_')"> IMPROVEMENTS
- </a> (37)
- <ol id="release_0.15.0_-_2007-11-2_._improvements_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1908">HADOOP-1908</a>. Restructure data node code so that block sending and
- receiving are separated from data transfer header handling.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1921">HADOOP-1921</a>. Save the configuration of completed/failed jobs and make them
- available via the web-ui.<br />(Amar Kamat via devaraj)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1266">HADOOP-1266</a>. Remove dependency of package org.apache.hadoop.net on
- org.apache.hadoop.dfs.<br />(Hairong Kuang via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1779">HADOOP-1779</a>. Replace INodeDirectory.getINode() by a getExistingPathINodes()
- to allow the retrieval of all existing INodes along a given path in a
- single lookup. This facilitates removal of the 'parent' field in the
- inode.<br />(Christophe Taton via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1756">HADOOP-1756</a>. Add toString() to some Writable-s.<br />(ab)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1727">HADOOP-1727</a>. New classes: MapWritable and SortedMapWritable.<br />(Jim Kellerman via ab)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1651">HADOOP-1651</a>. Improve progress reporting.<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1595">HADOOP-1595</a>. dfsshell can wait for a file to achieve its intended
- replication target. (Tsz Wo (Nicholas), SZE via dhruba)
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1693">HADOOP-1693</a>. Remove un-needed log fields in DFS replication classes,
- since the log may be accessed statically.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1231">HADOOP-1231</a>. Add generics to Mapper and Reducer interfaces.<br />(tomwhite via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1436">HADOOP-1436</a>. Improved command-line APIs, so that all tools need
- not subclass ToolBase, and generic parameter parser is public.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1703">HADOOP-1703</a>. DFS-internal code cleanups, removing several uses of
- the obsolete UTF8.<br />(Christophe Taton via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1731">HADOOP-1731</a>. Add Hadoop's version to contrib jar file names.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1689">HADOOP-1689</a>. Make shell scripts more portable. All shell scripts
- now explicitly depend on bash, but do not require that bash be
- installed in a particular location, as long as it is on $PATH.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1744">HADOOP-1744</a>. Remove many uses of the deprecated UTF8 class from
- the HDFS namenode.<br />(Christophe Taton via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1654">HADOOP-1654</a>. Add IOUtils class, containing generic io-related
- utility methods.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1158">HADOOP-1158</a>. Change JobTracker to record map-output transmission
- errors and use them to trigger speculative re-execution of tasks.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1601">HADOOP-1601</a>. Change GenericWritable to use ReflectionUtils for
- instance creation, avoiding classloader issues, and to implement
- Configurable.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1750">HADOOP-1750</a>. Log standard output and standard error when forking
- task processes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1803">HADOOP-1803</a>. Generalize build.xml to make files in all
- src/contrib/*/bin directories executable.<br />(stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1739">HADOOP-1739</a>. Let OS always choose the tasktracker's umbilical
- port. Also switch default address for umbilical connections to
- loopback.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1812">HADOOP-1812</a>. Let OS choose ports for IPC and RPC unit tests.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1825">HADOOP-1825</a>. Create $HADOOP_PID_DIR when it does not exist.<br />(Michael Bieniosek via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1425">HADOOP-1425</a>. Replace uses of ToolBase with the Tool interface.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1569">HADOOP-1569</a>. Reimplement DistCP to use the standard FileSystem/URI
- code in Hadoop so that you can copy from and to all of the supported file
- systems.<br />(Chris Douglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1018">HADOOP-1018</a>. Improve documentation w.r.t handling of lost heartbeats between
- TaskTrackers and JobTracker.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1718">HADOOP-1718</a>. Add ant targets for measuring code coverage with clover.<br />(simonwillnauer via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1592">HADOOP-1592</a>. Log error messages to the client console when tasks
- fail.<br />(Amar Kamat via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1879">HADOOP-1879</a>. Remove some unneeded casts.<br />(Nilay Vaish via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1878">HADOOP-1878</a>. Add space between priority links on job details
- page.<br />(Thomas Friol via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-120">HADOOP-120</a>. In ArrayWritable, prevent creation with null value
- class, and improve documentation.<br />(Cameron Pope via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1926">HADOOP-1926</a>. Add a random text writer example/benchmark so that we can
- benchmark compression codecs on random data.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1906">HADOOP-1906</a>. Warn the user if they have an obsolete mapred-default.xml
- file in their configuration directory.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1971">HADOOP-1971</a>. Warn when job does not specify a jar.<br />(enis via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1942">HADOOP-1942</a>. Increase the concurrency of transaction logging to
- edits log. Reduce the number of syncs by double-buffering the changes
- to the transaction log.<br />(Dhruba Borthakur)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2046">HADOOP-2046</a>. Improve mapred javadoc.<br />(Arun C. Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2105">HADOOP-2105</a>. Improve overview.html to clarify supported platforms,
- software pre-requisites for hadoop, how to install them on various
- platforms and a better general description of hadoop and its utility.<br />(Jim Kellerman via acmurthy)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.14.4_-_2007-11-26_')">Release 0.14.4 - 2007-11-26
- </a></h3>
- <ul id="release_0.14.4_-_2007-11-26_">
- <li><a href="javascript:toggleList('release_0.14.4_-_2007-11-26_._bug_fixes_')"> BUG FIXES
- </a> (3)
- <ol id="release_0.14.4_-_2007-11-26_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2140">HADOOP-2140</a>. Add missing Apache Licensing text at the front of several
- C and C++ files.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2169">HADOOP-2169</a>. Fix the DT_SONAME field of libhdfs.so to set it to the
- correct value of 'libhdfs.so', currently it is set to the absolute path of
- libhdfs.so.<br />(acmurthy)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2001">HADOOP-2001</a>. Make the job priority updates and job kills synchronized on
- the JobTracker. Deadlock was seen in the JobTracker because of the lack of
- this synchronization.<br />(Arun C Murthy via ddas)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.14.3_-_2007-10-19_')">Release 0.14.3 - 2007-10-19
- </a></h3>
- <ul id="release_0.14.3_-_2007-10-19_">
- <li><a href="javascript:toggleList('release_0.14.3_-_2007-10-19_._bug_fixes_')"> BUG FIXES
- </a> (3)
- <ol id="release_0.14.3_-_2007-10-19_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2053">HADOOP-2053</a>. Fixed a dangling reference to a memory buffer in the map
- output sorter.<br />(acmurthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2036">HADOOP-2036</a>. Fix a NullPointerException in JvmMetrics class.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-2043">HADOOP-2043</a>. Release 0.14.2 was compiled with Java 1.6 rather than
- Java 1.5.<br />(cutting)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.14.2_-_2007-10-09_')">Release 0.14.2 - 2007-10-09
- </a></h3>
- <ul id="release_0.14.2_-_2007-10-09_">
- <li><a href="javascript:toggleList('release_0.14.2_-_2007-10-09_._bug_fixes_')"> BUG FIXES
- </a> (9)
- <ol id="release_0.14.2_-_2007-10-09_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1948">HADOOP-1948</a>. Removed spurious error message during block crc upgrade.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1862">HADOOP-1862</a>. reduces are getting stuck trying to find map outputs.<br />(Arun C. Murthy via ddas)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1977">HADOOP-1977</a>. Fixed handling of ToolBase cli options in JobClient.<br />(enis via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1972">HADOOP-1972</a>. Fix LzoCompressor to ensure the user has actually asked
- to finish compression.<br />(arun via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1970">HADOOP-1970</a>. Fix deadlock in progress reporting in the task.<br />(Vivek
- Ratan via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1978">HADOOP-1978</a>. Name-node removes edits.new after a successful startup.<br />(Konstantin Shvachko via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1955">HADOOP-1955</a>. The Namenode tries to not pick the same source Datanode for
- a replication request if the earlier replication request for the same
- block and that source Datanode had failed.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1961">HADOOP-1961</a>. The -get option to dfs-shell works when a single filename
- is specified.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1997">HADOOP-1997</a>. TestCheckpoint closes the edits file after writing to it,
- otherwise the rename of this file on Windows fails.<br />(Konstantin Shvachko via dhruba)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.14.1_-_2007-09-04_')">Release 0.14.1 - 2007-09-04
- </a></h3>
- <ul id="release_0.14.1_-_2007-09-04_">
- <li><a href="javascript:toggleList('release_0.14.1_-_2007-09-04_._bug_fixes_')"> BUG FIXES
- </a> (3)
- <ol id="release_0.14.1_-_2007-09-04_._bug_fixes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1740">HADOOP-1740</a>. Fix null pointer exception in sorting map outputs.<br />(Devaraj
- Das via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1790">HADOOP-1790</a>. Fix tasktracker to work correctly on multi-homed
- boxes.<br />(Torsten Curdt via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1798">HADOOP-1798</a>. Fix jobtracker to correctly account for failed
- tasks.<br />(omalley via cutting)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.14.0_-_2007-08-17_')">Release 0.14.0 - 2007-08-17
- </a></h3>
- <ul id="release_0.14.0_-_2007-08-17_">
- <li><a href="javascript:toggleList('release_0.14.0_-_2007-08-17_._incompatible_changes_')"> INCOMPATIBLE CHANGES
- </a> (160)
- <ol id="release_0.14.0_-_2007-08-17_._incompatible_changes_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1134">HADOOP-1134</a>.
- CONFIG/API - dfs.block.size must now be a multiple of
- io.byte.per.checksum, otherwise new files can not be written.
- LAYOUT - DFS layout version changed from -6 to -7, which will require an
- upgrade from previous versions.
- PROTOCOL - Datanode RPC protocol version changed from 7 to 8.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1283">HADOOP-1283</a>
- API - deprecated file locking API.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-894">HADOOP-894</a>
- PROTOCOL - changed ClientProtocol to fetch parts of block locations.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1336">HADOOP-1336</a>
- CONFIG - Enable speculative execution by default.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1197">HADOOP-1197</a>
- API - deprecated method for Configuration.getObject, because
- Configurations should only contain strings.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1343">HADOOP-1343</a>
- API - deprecate Configuration.set(String,Object) so that only strings are
- put in Configurations.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1207">HADOOP-1207</a>
- CLI - Fix FsShell 'rm' command to continue when a non-existent file is
- encountered.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1473">HADOOP-1473</a>
- CLI/API - Job, TIP, and Task id formats have changed and are now unique
- across job tracker restarts.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1400">HADOOP-1400</a>
- API - JobClient constructor now takes a JobConf object instead of a
- Configuration object.
- <p/>
- NEW FEATURES and BUG FIXES
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1197">HADOOP-1197</a>. In Configuration, deprecate getObject() and add
- getRaw(), which skips variable expansion.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1343">HADOOP-1343</a>. In Configuration, deprecate set(String,Object) and
- implement Iterable.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1344">HADOOP-1344</a>. Add RunningJob#getJobName().<br />(Michael Bieniosek via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1342">HADOOP-1342</a>. In aggregators, permit one to limit the number of
- unique values per key.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1340">HADOOP-1340</a>. Set the replication factor of the MD5 file in the filecache
- to be the same as the replication factor of the original file.<br />(Dhruba Borthakur via tomwhite.)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1355">HADOOP-1355</a>. Fix null pointer dereference in
- TaskLogAppender.append(LoggingEvent).<br />(Arun C Murthy via tomwhite.)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1357">HADOOP-1357</a>. Fix CopyFiles to correctly avoid removing "/".<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-234">HADOOP-234</a>. Add pipes facility, which permits writing MapReduce
- programs in C++.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1359">HADOOP-1359</a>. Fix a potential NullPointerException in HDFS.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1364">HADOOP-1364</a>. Fix inconsistent synchronization in SequenceFile.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1379">HADOOP-1379</a>. Add findbugs target to build.xml.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1364">HADOOP-1364</a>. Fix various inconsistent synchronization issues.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1393">HADOOP-1393</a>. Remove a potential unexpected negative number from
- uses of random number generator.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1387">HADOOP-1387</a>. A number of "performance" code-cleanups suggested
- by findbugs.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1401">HADOOP-1401</a>. Add contrib/hbase javadoc to tree.<br />(stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-894">HADOOP-894</a>. Change HDFS so that the client only retrieves a limited
- number of block locations per request from the namenode.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1406">HADOOP-1406</a>. Plug a leak in MapReduce's use of metrics.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1394">HADOOP-1394</a>. Implement "performance" code-cleanups in HDFS
- suggested by findbugs.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1413">HADOOP-1413</a>. Add example program that uses Knuth's dancing links
- algorithm to solve pentomino problems.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1226">HADOOP-1226</a>. Change HDFS so that paths it returns are always
- fully qualified.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-800">HADOOP-800</a>. Improvements to HDFS web-based file browser.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1408">HADOOP-1408</a>. Fix a compiler warning by adding a class to replace
- a generic.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1376">HADOOP-1376</a>. Modify RandomWriter example so that it can generate
- data for the Terasort benchmark.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1429">HADOOP-1429</a>. Stop logging exceptions during normal IPC server
- shutdown.<br />(stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1461">HADOOP-1461</a>. Fix the synchronization of the task tracker to
- avoid lockups in job cleanup.<br />(Arun C Murthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1446">HADOOP-1446</a>. Update the TaskTracker metrics while the task is
- running.<br />(Devaraj via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1414">HADOOP-1414</a>. Fix a number of issues identified by FindBugs as
- "Bad Practice".<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1392">HADOOP-1392</a>. Fix "correctness" bugs identified by FindBugs in
- fs and dfs packages.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1412">HADOOP-1412</a>. Fix "dodgy" bugs identified by FindBugs in fs and
- io packages.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1261">HADOOP-1261</a>. Remove redundant events from HDFS namenode's edit
- log when a datanode restarts.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1336">HADOOP-1336</a>. Re-enable speculative execution by
- default.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1311">HADOOP-1311</a>. Fix a bug in BytesWritable#set() where start offset
- was ignored.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1450">HADOOP-1450</a>. Move checksumming closer to user code, so that
- checksums are created before data is stored in large buffers and
- verified after data is read from large buffers, to better catch
- memory errors.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1447">HADOOP-1447</a>. Add support in contrib/data_join for text inputs.<br />(Senthil Subramanian via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1456">HADOOP-1456</a>. Fix TestDecommission assertion failure by setting
- the namenode to ignore the load on datanodes while allocating
- replicas.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1396">HADOOP-1396</a>. Fix FileNotFoundException on DFS block.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1467">HADOOP-1467</a>. Remove redundant counters from WordCount example.<br />(Owen O'Malley via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1139">HADOOP-1139</a>. Log HDFS block transitions at INFO level, to better
- enable diagnosis of problems.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1269">HADOOP-1269</a>. Finer grained locking in HDFS namenode.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1438">HADOOP-1438</a>. Improve HDFS documentation, correcting typos and
- making images appear in PDF. Also update copyright date for all
- docs.<br />(Luke Nezda via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1457">HADOOP-1457</a>. Add counters for monitoring task assignments.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1472">HADOOP-1472</a>. Fix so that timed-out tasks are counted as failures
- rather than as killed.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1234">HADOOP-1234</a>. Fix a race condition in file cache that caused
- tasktracker to not be able to find cached files.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1482">HADOOP-1482</a>. Fix secondary namenode to roll info port.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1300">HADOOP-1300</a>. Improve removal of excess block replicas to be
- rack-aware. Attempts are now made to keep replicas on more
- racks.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1417">HADOOP-1417</a>. Disable a few FindBugs checks that generate a lot
- of spurious warnings.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1320">HADOOP-1320</a>. Rewrite RandomWriter example to bypass reduce.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1449">HADOOP-1449</a>. Add some examples to contrib/data_join.<br />(Senthil Subramanian via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1459">HADOOP-1459</a>. Fix so that, in HDFS, getFileCacheHints() returns
- hostnames instead of IP addresses.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1493">HADOOP-1493</a>. Permit specification of "java.library.path" system
- property in "mapred.child.java.opts" configuration property.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1372">HADOOP-1372</a>. Use LocalDirAllocator for HDFS temporary block
- files, so that disk space, writability, etc. is considered.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1193">HADOOP-1193</a>. Pool allocation of compression codecs. This
- eliminates a memory leak that could cause OutOfMemoryException,
- and also substantially improves performance.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1492">HADOOP-1492</a>. Fix a NullPointerException handling version
- mismatch during datanode registration.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1442">HADOOP-1442</a>. Fix handling of zero-length input splits.<br />(Senthil Subramanian via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1444">HADOOP-1444</a>. Fix HDFS block id generation to check pending
- blocks for duplicates.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1207">HADOOP-1207</a>. Fix FsShell's 'rm' command to not stop when one of
- the named files does not exist.<br />(Tsz Wo Sze via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1475">HADOOP-1475</a>. Clear tasktracker's file cache before it
- re-initializes, to avoid confusion.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1505">HADOOP-1505</a>. Remove spurious stacktrace in ZlibFactory
- introduced in <a href="http://issues.apache.org/jira/browse/HADOOP-1093">HADOOP-1093</a>.<br />(Michael Stack via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1484">HADOOP-1484</a>. Permit one to kill jobs from the web ui. Note that
- this is disabled by default. One must set
- "webinterface.private.actions" to enable this.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1003">HADOOP-1003</a>. Remove flushing of namenode edit log from primary
- namenode lock, increasing namenode throughput.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1023">HADOOP-1023</a>. Add links to searchable mail archives.<br />(tomwhite via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1504">HADOOP-1504</a>. Fix terminate-hadoop-cluster script in contrib/ec2
- to only terminate Hadoop instances, and not other instances
- started by the same user.<br />(tomwhite via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1462">HADOOP-1462</a>. Improve task progress reporting. Progress reports
- are no longer blocking since i/o is performed in a separate
- thread. Reporting during sorting and more is also more
- consistent.<br />(Vivek Ratan via cutting)</li>
- <li>[ intentionally blank ]
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1453">HADOOP-1453</a>. Remove some unneeded calls to FileSystem#exists()
- when opening files, reducing the namenode load somewhat.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1489">HADOOP-1489</a>. Fix text input truncation bug due to mark/reset.
- Add a unittest.<br />(Bwolen Yang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1455">HADOOP-1455</a>. Permit specification of arbitrary job options on
- pipes command line.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1501">HADOOP-1501</a>. Better randomize sending of block reports to
- namenode, to reduce load spikes.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1147">HADOOP-1147</a>. Remove @author tags from Java source files.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1283">HADOOP-1283</a>. Convert most uses of UTF8 in the namenode to be
- String.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1511">HADOOP-1511</a>. Speedup hbase unit tests.<br />(stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1517">HADOOP-1517</a>. Remove some synchronization in namenode to permit
- finer grained locking previously added.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1512">HADOOP-1512</a>. Fix failing TestTextInputFormat on Windows.<br />(Senthil Subramanian via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1518">HADOOP-1518</a>. Add a session id to job metrics, for use by HOD.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1292">HADOOP-1292</a>. Change 'bin/hadoop fs -get' to first copy files to
- a temporary name, then rename them to their final name, so that
- failures don't leave partial files.<br />(Tsz Wo Sze via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1377">HADOOP-1377</a>. Add support for modification time to FileSystem and
- implement in HDFS and local implementations. Also, alter access
- to file properties to be through a new FileStatus interface.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1515">HADOOP-1515</a>. Add MultiFileInputFormat, which can pack multiple,
- typically small, input files into each split.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1514">HADOOP-1514</a>. Make reducers report progress while waiting for map
- outputs, so they're not killed.<br />(Vivek Ratan via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1508">HADOOP-1508</a>. Add an Ant task for FsShell operations. Also add
- new FsShell commands "touchz", "test" and "stat".<br />(Chris Douglas via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1028">HADOOP-1028</a>. Add log messages for server startup and shutdown.<br />(Tsz Wo Sze via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1485">HADOOP-1485</a>. Add metrics for monitoring shuffle.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1536">HADOOP-1536</a>. Remove file locks from libhdfs tests.<br />(Dhruba Borthakur via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1520">HADOOP-1520</a>. Add appropriate synchronization to FSEditsLog.<br />(Dhruba Borthakur via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1513">HADOOP-1513</a>. Fix a race condition in directory creation.<br />(Devaraj via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1546">HADOOP-1546</a>. Remove spurious column from HDFS web UI.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1556">HADOOP-1556</a>. Make LocalJobRunner delete working files at end of
- job run.<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1571">HADOOP-1571</a>. Add contrib lib directories to root build.xml
- javadoc classpath.<br />(Michael Stack via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1554">HADOOP-1554</a>. Log killed tasks to the job history and display them on the
- web/ui.<br />(Devaraj Das via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1533">HADOOP-1533</a>. Add persistent error logging for distcp. The logs are stored
- into a specified hdfs directory.<br />(Senthil Subramanian via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1286">HADOOP-1286</a>. Add support to HDFS for distributed upgrades, which
- permits coordinated upgrade of datanode data.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1580">HADOOP-1580</a>. Improve contrib/streaming so that subprocess exit
- status is displayed for errors.<br />(John Heidemann via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1448">HADOOP-1448</a>. In HDFS, randomize lists of non-local block
- locations returned to client, so that load is better balanced.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1578">HADOOP-1578</a>. Fix datanode to send its storage id to namenode
- during registration.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1584">HADOOP-1584</a>. Fix a bug in GenericWritable which limited it to
- 128 types instead of 256.<br />(Espen Amble Kolstad via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1473">HADOOP-1473</a>. Make job ids unique across jobtracker restarts.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1582">HADOOP-1582</a>. Fix hdfslib to return 0 instead of -1 at
- end-of-file, per C conventions.<br />(Christian Kunz via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-911">HADOOP-911</a>. Fix a multithreading bug in libhdfs.<br />(Christian Kunz)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1486">HADOOP-1486</a>. Fix so that fatal exceptions in namenode cause it
- to exit.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1470">HADOOP-1470</a>. Factor checksum generation and validation out of
- ChecksumFileSystem so that it can be reused by FileSystem's with
- built-in checksumming.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1590">HADOOP-1590</a>. Use relative urls in jobtracker jsp pages, so that
- webapp can be used in non-root contexts.<br />(Thomas Friol via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1596">HADOOP-1596</a>. Fix the parsing of taskids by streaming and improve the
- error reporting.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1535">HADOOP-1535</a>. Fix the user-controlled grouping to the reduce function.<br />(Vivek Ratan via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1585">HADOOP-1585</a>. Modify GenericWritable to declare the classes as subtypes
- of Writable<br />(Espen Amble Kolstad via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1576">HADOOP-1576</a>. Fix errors in count of completed tasks when
- speculative execution is enabled.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1598">HADOOP-1598</a>. Fix license headers: adding missing; updating old.<br />(Enis Soztutar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1547">HADOOP-1547</a>. Provide examples for aggregate library.<br />(Runping Qi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1570">HADOOP-1570</a>. Permit jobs to enable and disable the use of
- hadoop's native library.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1433">HADOOP-1433</a>. Add job priority.<br />(Johan Oskarsson via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1597">HADOOP-1597</a>. Add status reports and post-upgrade options to HDFS
- distributed upgrade.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1524">HADOOP-1524</a>. Permit user task logs to appear as they're
- created.<br />(Michael Bieniosek via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1599">HADOOP-1599</a>. Fix distcp bug on Windows.<br />(Senthil Subramanian via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1562">HADOOP-1562</a>. Add JVM metrics, including GC and logging stats.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1613">HADOOP-1613</a>. Fix "DFS Health" page to display correct time of
- last contact.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1134">HADOOP-1134</a>. Add optimized checksum support to HDFS. Checksums
- are now stored with each block, rather than as parallel files.
- This reduces the namenode's memory requirements and increases
- data integrity.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1400">HADOOP-1400</a>. Make JobClient retry requests, so that clients can
- survive jobtracker problems.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1564">HADOOP-1564</a>. Add unit tests for HDFS block-level checksums.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1620">HADOOP-1620</a>. Reduce the number of abstract FileSystem methods,
- simplifying implementations.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1625">HADOOP-1625</a>. Fix a "could not move files" exception in datanode.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1624">HADOOP-1624</a>. Fix an infinite loop in datanode.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1084">HADOOP-1084</a>. Switch mapred file cache to use file modification
- time instead of checksum to detect file changes, as checksums are
- no longer easily accessed.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1623">HADOOP-1623</a>. Fix an infinite loop when copying directories.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1603">HADOOP-1603</a>. Fix a bug in namenode initialization where
- default replication is sometimes reset to one on restart.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1635">HADOOP-1635</a>. Remove hardcoded keypair name and fix launch-hadoop-cluster
- to support later versions of ec2-api-tools.<br />(Stu Hood via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1638">HADOOP-1638</a>. Fix contrib EC2 scripts to support NAT addressing.<br />(Stu Hood via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1632">HADOOP-1632</a>. Fix an IllegalArgumentException in fsck.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1619">HADOOP-1619</a>. Fix FSInputChecker to not attempt to read past EOF.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1640">HADOOP-1640</a>. Fix TestDecommission on Windows.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1587">HADOOP-1587</a>. Fix TestSymLink to get required system properties.<br />(Devaraj Das via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1628">HADOOP-1628</a>. Add block CRC protocol unit tests.<br />(Raghu Angadi via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1653">HADOOP-1653</a>. FSDirectory code-cleanups. FSDirectory.INode
- becomes a static class.<br />(Christophe Taton via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1066">HADOOP-1066</a>. Restructure documentation to make more user
- friendly.<br />(Connie Kleinjans and Jeff Hammerbacher via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1551">HADOOP-1551</a>. libhdfs supports setting replication factor and
- retrieving modification time of files.<br />(Sameer Paranjpye via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1647">HADOOP-1647</a>. FileSystem.getFileStatus returns valid values for "/".<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1657">HADOOP-1657</a>. Fix NNBench to ensure that the block size is a
- multiple of bytes.per.checksum.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1553">HADOOP-1553</a>. Replace user task output and log capture code to use shell
- redirection instead of copier threads in the TaskTracker. Capping the
- size of the output is now done via tail in memory and thus should not be
- large. The output of the tasklog servlet is not forced into UTF8 and is
- not buffered entirely in memory. (omalley)
- Configuration changes to hadoop-default.xml:
- remove mapred.userlog.num.splits
- remove mapred.userlog.purge.splits
- change default mapred.userlog.limit.kb to 0 (no limit)
- change default mapred.userlog.retain.hours to 24
- Configuration changes to log4j.properties:
- remove log4j.appender.TLA.noKeepSplits
- remove log4j.appender.TLA.purgeLogSplits
- remove log4j.appender.TLA.logsRetainHours
- URL changes:
- http://&lt;tasktracker&gt;/tasklog.jsp -&gt; http://&lt;tasktracker&gt;/tasklog with
- parameters limited to start and end, which may be positive (from
- start) or negative (from end).
- Environment:
- require bash (v2 or later) and tail
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1659">HADOOP-1659</a>. Fix a job id/job name mixup.<br />(Arun C. Murthy via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1665">HADOOP-1665</a>. When HDFS Trash is enabled and the same file is created
- and deleted more than once, the succeeding deletions create Trash item
- names suffixed with an integer.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1666">HADOOP-1666</a>. FsShell object can be used for multiple fs commands.<br />(Dhruba Borthakur via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1654">HADOOP-1654</a>. Remove performance regression introduced by Block CRC.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1680">HADOOP-1680</a>. Improvements to Block CRC upgrade messages.<br />(Raghu Angadi via dhruba)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-71">HADOOP-71</a>. Allow Text and SequenceFile Map/Reduce inputs from non-default
- filesystems.<br />(omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1568">HADOOP-1568</a>. Expose HDFS as xml/http filesystem to provide cross-version
- compatibility.<br />(Chris Douglas via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1668">HADOOP-1668</a>. Added an INCOMPATIBILITY section to CHANGES.txt.<br />(nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1629">HADOOP-1629</a>. Added an upgrade test for <a href="http://issues.apache.org/jira/browse/HADOOP-1134">HADOOP-1134</a>.<br />(Raghu Angadi via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1698">HADOOP-1698</a>. Fix performance problems on map output sorting for jobs
- with large numbers of reduces.<br />(Devaraj Das via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1716">HADOOP-1716</a>. Fix a Pipes wordcount example to remove the 'file:'
- scheme from its output path.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1714">HADOOP-1714</a>. Fix TestDFSUpgradeFromImage to work on Windows.<br />(Raghu Angadi via nigel)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1663">HADOOP-1663</a>. Return a non-zero exit code if streaming fails.<br />(Lohit Renu
- via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1712">HADOOP-1712</a>. Fix an unhandled exception on datanode during block
- CRC upgrade.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1717">HADOOP-1717</a>. Fix TestDFSUpgradeFromImage to work on Solaris.<br />(nigel via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1437">HADOOP-1437</a>. Add Eclipse plugin in contrib.<br />(Eugene Hung and Christophe Taton via cutting)</li>
- </ol>
- </li>
- </ul>
- <h3><a href="javascript:toggleList('release_0.13.0_-_2007-06-08_')">Release 0.13.0 - 2007-06-08
- </a></h3>
- <ol id="release_0.13.0_-_2007-06-08_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1047">HADOOP-1047</a>. Fix TestReplication to succeed more reliably.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1063">HADOOP-1063</a>. Fix a race condition in MiniDFSCluster test code.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1101">HADOOP-1101</a>. In web ui, split shuffle statistics from reduce
- statistics, and add some task averages.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1071">HADOOP-1071</a>. Improve handling of protocol version mismatch in
- JobTracker.<br />(Tahir Hashmi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1116">HADOOP-1116</a>. Increase heap size used for contrib unit tests.<br />(Philippe Gassmann via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1120">HADOOP-1120</a>. Add contrib/data_join, tools to simplify joining
- data from multiple sources using MapReduce.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1064">HADOOP-1064</a>. Reduce log level of some DFSClient messages.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1137">HADOOP-1137</a>. Fix StatusHttpServer to work correctly when
- resources are in a jar file.<br />(Benjamin Reed via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1094">HADOOP-1094</a>. Optimize generated Writable implementations for
- records to not allocate a new BinaryOutputArchive or
- BinaryInputArchive per call.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1068">HADOOP-1068</a>. Improve error message for clusters with 0 datanodes.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1122">HADOOP-1122</a>. Fix divide-by-zero exception in FSNamesystem
- chooseTarget method.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1131">HADOOP-1131</a>. Add a closeAll() static method to FileSystem.<br />(Philippe Gassmann via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1085">HADOOP-1085</a>. Improve port selection in HDFS and MapReduce test
- code. Ports are now selected by the OS during testing rather than
- by probing for free ports, improving test reliability.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1153">HADOOP-1153</a>. Fix HDFS daemons to correctly stop their threads.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1146">HADOOP-1146</a>. Add a counter for reduce input keys and rename the
- "reduce input records" counter to be "reduce input groups".<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1165">HADOOP-1165</a>. In records, replace identical generated toString
- methods with a method on the base class.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1164">HADOOP-1164</a>. Fix TestReplicationPolicy to specify port zero, so
- that a free port is automatically selected.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1166">HADOOP-1166</a>. Add a NullOutputFormat and use it in the
- RandomWriter example.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1169">HADOOP-1169</a>. Fix a cut/paste error in CopyFiles utility so that
- S3-based source files are correctly copied.<br />(Michael Stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1167">HADOOP-1167</a>. Remove extra synchronization in InMemoryFileSystem.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1110">HADOOP-1110</a>. Fix an off-by-one error counting map inputs.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1178">HADOOP-1178</a>. Fix a NullPointerException during namenode startup.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1011">HADOOP-1011</a>. Fix a ConcurrentModificationException when viewing
- job history.<br />(Tahir Hashmi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-672">HADOOP-672</a>. Improve help for fs shell commands.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1170">HADOOP-1170</a>. Improve datanode performance by removing device
- checks from common operations.<br />(Igor Bolotin via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1090">HADOOP-1090</a>. Fix SortValidator's detection of whether the input
- file belongs to the sort-input or sort-output directory.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1081">HADOOP-1081</a>. Fix bin/hadoop on Darwin.<br />(Michael Bieniosek via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1045">HADOOP-1045</a>. Add contrib/hbase, a BigTable-like online database.<br />(Jim Kellerman via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1156">HADOOP-1156</a>. Fix a NullPointerException in MiniDFSCluster.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-702">HADOOP-702</a>. Add tools to help automate HDFS upgrades.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1163">HADOOP-1163</a>. Fix ganglia metrics to aggregate metrics from different
- hosts properly.<br />(Michael Bieniosek via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1194">HADOOP-1194</a>. Make compression style record level for map output
- compression.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1187">HADOOP-1187</a>. Improve DFS Scalability: avoid scanning entire list of
- datanodes in getAdditionalBlocks.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1133">HADOOP-1133</a>. Add tool to analyze and debug namenode on a production
- cluster.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1151">HADOOP-1151</a>. Remove spurious printing to stderr in streaming
- PipeMapRed.<br />(Koji Noguchi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-988">HADOOP-988</a>. Change namenode to use a single map of blocks to metadata.<br />(Raghu Angadi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1203">HADOOP-1203</a>. Change UpgradeUtilities used by DFS tests to use
- MiniDFSCluster to start and stop NameNode/DataNodes.<br />(Nigel Daley via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1217">HADOOP-1217</a>. Add test.timeout property to build.xml, so that
- long-running unit tests may be automatically terminated.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1149">HADOOP-1149</a>. Improve DFS Scalability: make
- processOverReplicatedBlock() a no-op if blocks are not
- over-replicated.<br />(Raghu Angadi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1149">HADOOP-1149</a>. Improve DFS Scalability: optimize getDistance(),
- contains(), and isOnSameRack() in NetworkTopology.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1218">HADOOP-1218</a>. Make synchronization on TaskTracker's RunningJob
- object consistent.<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1219">HADOOP-1219</a>. Ignore progress report once a task has reported as
- 'done'.<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1114">HADOOP-1114</a>. Permit user to specify additional CLASSPATH elements
- with a HADOOP_CLASSPATH environment variable.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1198">HADOOP-1198</a>. Remove ipc.client.timeout parameter override from
- unit test configuration. Using the default is more robust and
- has almost the same run time.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1211">HADOOP-1211</a>. Remove deprecated constructor and unused static
- members in DataNode class.<br />(Konstantin Shvachko via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1136">HADOOP-1136</a>. Fix ArrayIndexOutOfBoundsException in
- FSNamesystem$UnderReplicatedBlocks add() method.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-978">HADOOP-978</a>. Add the client name and the address of the node that
- previously started to create the file to the description of
- AlreadyBeingCreatedException.<br />(Konstantin Shvachko via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1001">HADOOP-1001</a>. Check the type of keys and values generated by the
- mapper against the types specified in JobConf.<br />(Tahir Hashmi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-971">HADOOP-971</a>. Improve DFS Scalability: Improve name node performance
- by adding a hostname to datanodes map.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1189">HADOOP-1189</a>. Fix 'No space left on device' exceptions on datanodes.<br />(Raghu Angadi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-819">HADOOP-819</a>. Change LineRecordWriter to not insert a tab between
- key and value when either is null, and to print nothing when both
- are null.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1204">HADOOP-1204</a>. Rename InputFormatBase to be FileInputFormat, and
- deprecate InputFormatBase. Also make LineRecordReader easier to
- extend.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1213">HADOOP-1213</a>. Improve logging of errors by IPC server, to
- consistently include the service name and the call.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1238">HADOOP-1238</a>. Fix metrics reporting by TaskTracker to correctly
- track maps_running and reduces_running.<br />(Michael Bieniosek via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1093">HADOOP-1093</a>. Fix a race condition in HDFS where blocks were
- sometimes erased before they were reported written.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1239">HADOOP-1239</a>. Add a package name to some testjar test classes.<br />(Jim Kellerman via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1241">HADOOP-1241</a>. Fix NullPointerException in processReport when
- namenode is restarted.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1244">HADOOP-1244</a>. Fix stop-dfs.sh to no longer incorrectly specify
- slaves file for stopping datanode.<br />(Michael Bieniosek via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1253">HADOOP-1253</a>. Fix ConcurrentModificationException and
- NullPointerException in JobControl.<br />(Johan Oskarsson via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1256">HADOOP-1256</a>. Fix NameNode so that multiple DataNodeDescriptors
- can no longer be created on startup.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1214">HADOOP-1214</a>. Replace streaming classes with new counterparts
- from Hadoop core.<br />(Runping Qi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1250">HADOOP-1250</a>. Move a chmod utility from streaming to FileUtil.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1258">HADOOP-1258</a>. Fix TestCheckpoint test case to wait for
- MiniDFSCluster to be active.<br />(Nigel Daley via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1148">HADOOP-1148</a>. Re-indent all Java source code to consistently use
- two spaces per indent level.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1251">HADOOP-1251</a>. Add a method to Reporter to get the map InputSplit.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1224">HADOOP-1224</a>. Fix "Browse the filesystem" link to no longer point
- to dead datanodes.<br />(Enis Soztutar via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1154">HADOOP-1154</a>. Fail a streaming task if the threads reading from or
- writing to the streaming process fail.<br />(Koji Noguchi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-968">HADOOP-968</a>. Move shuffle and sort to run in reduce's child JVM,
- rather than in TaskTracker.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1111">HADOOP-1111</a>. Add support for client notification of job
- completion. If the job configuration has a job.end.notification.url
- property it will make an HTTP GET request to the specified URL.
- The number of retries and the interval between retries is also
- configurable.<br />(Alejandro Abdelnur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1275">HADOOP-1275</a>. Fix misspelled job notification property in
- hadoop-default.xml.<br />(Alejandro Abdelnur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1152">HADOOP-1152</a>. Fix race condition in MapOutputCopier.copyOutput file
- rename causing possible reduce task hang.<br />(Tahir Hashmi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1050">HADOOP-1050</a>. Distinguish between failed and killed tasks so as to
- not count a lost tasktracker against the job.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1271">HADOOP-1271</a>. Fix StreamBaseRecordReader to be able to log record
- data that's not UTF-8.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1190">HADOOP-1190</a>. Fix unchecked warnings in main Hadoop code.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1127">HADOOP-1127</a>. Fix AlreadyBeingCreatedException in namenode for
- jobs run with speculative execution.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1282">HADOOP-1282</a>. Omnibus HBase patch. Improved tests &amp; configuration.<br />(Jim Kellerman via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1262">HADOOP-1262</a>. Make dfs client try to read from a different replica
- of the checksum file when a checksum error is detected.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1279">HADOOP-1279</a>. Fix JobTracker to maintain list of recently
- completed jobs by order of completion, not submission.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1284">HADOOP-1284</a>. In contrib/streaming, permit flexible specification
- of field delimiter and fields for partitioning and sorting.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1176">HADOOP-1176</a>. Fix a bug where reduce would hang when a map had
- more than 2GB of output for it.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1293">HADOOP-1293</a>. Fix contrib/streaming to print more than the first
- twenty lines of standard error.<br />(Koji Noguchi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1297">HADOOP-1297</a>. Fix datanode so that requests to remove blocks that
- do not exist no longer cause block reports to be re-sent every
- second.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1216">HADOOP-1216</a>. Change MapReduce so that, when numReduceTasks is
- zero, map outputs are written directly as final output, skipping
- shuffle, sort and reduce. Use this to implement reduce=NONE
- option in contrib/streaming.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1294">HADOOP-1294</a>. Fix unchecked warnings in main Hadoop code under
- Java 6.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1299">HADOOP-1299</a>. Fix so that RPC will restart after RPC.stopClient()
- has been called.<br />(Michael Stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1278">HADOOP-1278</a>. Improve blacklisting of TaskTrackers by JobTracker,
- to reduce false positives.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1290">HADOOP-1290</a>. Move contrib/abacus into mapred/lib/aggregate.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1272">HADOOP-1272</a>. Extract inner classes from FSNamesystem into separate
- classes.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1247">HADOOP-1247</a>. Add support to contrib/streaming for aggregate
- package, formerly called Abacus.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1061">HADOOP-1061</a>. Fix bug in listing files in the S3 filesystem.
- NOTE: this change is not backwards compatible! You should use the
- MigrationTool supplied to migrate existing S3 filesystem data to
- the new format. Please back up your data first before upgrading
- (using 'hadoop distcp' for example).<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1304">HADOOP-1304</a>. Make configurable the maximum number of task
- attempts before a job fails.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1308">HADOOP-1308</a>. Use generics to restrict types when classes are
- passed as parameters to JobConf methods.<br />(Michael Bieniosek via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1312">HADOOP-1312</a>. Fix a ConcurrentModificationException in NameNode
- that killed the heartbeat monitoring thread.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1315">HADOOP-1315</a>. Clean up contrib/streaming, switching it to use core
- classes more and removing unused code.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-485">HADOOP-485</a>. Allow a different comparator for grouping keys in
- calls to reduce.<br />(Tahir Hashmi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1322">HADOOP-1322</a>. Fix TaskTracker blacklisting to work correctly in
- one- and two-node clusters.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1144">HADOOP-1144</a>. Permit one to specify a maximum percentage of tasks
- that can fail before a job is aborted. The default is zero.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1184">HADOOP-1184</a>. Fix HDFS decommissioning to complete when the only
- copy of a block is on a decommissioned node.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1263">HADOOP-1263</a>. Change DFSClient to retry certain namenode calls
- with a random, exponentially increasing backoff time, to avoid
- overloading the namenode on, e.g., job start.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1325">HADOOP-1325</a>. First complete, functioning version of HBase.<br />(Jim Kellerman via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1276">HADOOP-1276</a>. Make tasktracker expiry interval configurable.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1326">HADOOP-1326</a>. Change JobClient#RunJob() to return the job.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1270">HADOOP-1270</a>. Randomize the fetch of map outputs, speeding the
- shuffle.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1200">HADOOP-1200</a>. Restore disk checking lost in <a href="http://issues.apache.org/jira/browse/HADOOP-1170">HADOOP-1170</a>.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1252">HADOOP-1252</a>. Changed MapReduce's allocation of local files to
- use round-robin among available devices, rather than a hashcode.
- More care is also taken to not allocate files on full or offline
- drives.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1324">HADOOP-1324</a>. Change so that an FSError kills only the task that
- generates it rather than the entire task tracker.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1310">HADOOP-1310</a>. Fix unchecked warnings in aggregate code.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1255">HADOOP-1255</a>. Fix a bug where the namenode falls into an infinite
- loop trying to remove a dead node.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1160">HADOOP-1160</a>. Fix DistributedFileSystem.close() to close the
- underlying FileSystem, correctly aborting files being written.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1341">HADOOP-1341</a>. Fix intermittent failures in HBase unit tests
- caused by deadlock.<br />(Jim Kellerman via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1350">HADOOP-1350</a>. Fix shuffle performance problem caused by forcing
- chunked encoding of map outputs.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1345">HADOOP-1345</a>. Fix HDFS to correctly retry another replica when a
- checksum error is encountered.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1205">HADOOP-1205</a>. Improve synchronization around HDFS block map.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1353">HADOOP-1353</a>. Fix a potential NullPointerException in namenode.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1354">HADOOP-1354</a>. Fix a potential NullPointerException in FsShell.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1358">HADOOP-1358</a>. Fix a potential bug when DFSClient calls skipBytes.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1356">HADOOP-1356</a>. Fix a bug in ValueHistogram.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1363">HADOOP-1363</a>. Fix locking bug in JobClient#waitForCompletion().<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1368">HADOOP-1368</a>. Fix inconsistent synchronization in JobInProgress.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1369">HADOOP-1369</a>. Fix inconsistent synchronization in TaskTracker.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1361">HADOOP-1361</a>. Fix various calls to skipBytes() to check return
- value.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1388">HADOOP-1388</a>. Fix a potential NullPointerException in web ui.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1385">HADOOP-1385</a>. Fix MD5Hash#hashCode() to generally hash to more
- than 256 values.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1386">HADOOP-1386</a>. Fix Path to not permit the empty string as a
- path, as this has led to accidental file deletion. Instead
- force applications to use "." to name the default directory.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1407">HADOOP-1407</a>. Fix integer division bug in JobInProgress which
- meant failed tasks didn't cause the job to fail.<br />(Arun C Murthy via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1427">HADOOP-1427</a>. Fix a typo that caused GzipCodec to incorrectly use
- a very small input buffer.<br />(Espen Amble Kolstad via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1435">HADOOP-1435</a>. Fix globbing code to no longer use the empty string
- to indicate the default directory, per <a href="http://issues.apache.org/jira/browse/HADOOP-1386">HADOOP-1386</a>.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1411">HADOOP-1411</a>. Make task retry framework handle
- AlreadyBeingCreatedException when wrapped as a RemoteException.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1242">HADOOP-1242</a>. Improve handling of DFS upgrades.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1332">HADOOP-1332</a>. Fix so that TaskTracker exits reliably during unit
- tests on Windows.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1431">HADOOP-1431</a>. Fix so that sort progress reporting during map runs
- only while sorting, so that stuck maps are correctly terminated.<br />(Devaraj Das and Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1452">HADOOP-1452</a>. Change TaskTracker.MapOutputServlet.doGet.totalRead
- to a long, permitting map outputs to exceed 2^31 bytes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1443">HADOOP-1443</a>. Fix a bug opening zero-length files in HDFS.<br />(Konstantin Shvachko via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.12.3_-_2007-04-06_')">Release 0.12.3 - 2007-04-06
- </a></h3>
- <ol id="release_0.12.3_-_2007-04-06_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1162">HADOOP-1162</a>. Fix bug in record CSV and XML serialization of
- binary values.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1123">HADOOP-1123</a>. Fix NullPointerException in LocalFileSystem when
- trying to recover from a checksum error.<br />(Hairong Kuang &amp; Nigel Daley via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1177">HADOOP-1177</a>. Fix bug where IOException in MapOutputLocation.getFile
- was not being logged.<br />(Devaraj Das via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1175">HADOOP-1175</a>. Fix bugs in JSP for displaying a task's log messages.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1191">HADOOP-1191</a>. Fix map tasks to wait until sort progress thread has
- stopped before reporting the task done.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1192">HADOOP-1192</a>. Fix an integer overflow bug in FSShell's 'dus'
- command and a performance problem in HDFS's implementation of it.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1105">HADOOP-1105</a>. Fix reducers to make "progress" while iterating
- through values.<br />(Devaraj Das &amp; Owen O'Malley via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1179">HADOOP-1179</a>. Make Task Tracker close index file as soon as the read
- is done when serving get-map-output requests.<br />(Devaraj Das via tomwhite)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.12.2_-_2007-23-17_')">Release 0.12.2 - 2007-03-23
- </a></h3>
- <ol id="release_0.12.2_-_2007-23-17_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1135">HADOOP-1135</a>. Fix bug in block report processing which may cause
- the namenode to delete blocks.<br />(Dhruba Borthakur via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1145">HADOOP-1145</a>. Make XML serializer and deserializer classes public
- in record package.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1140">HADOOP-1140</a>. Fix a deadlock in metrics.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1150">HADOOP-1150</a>. Fix streaming -reducer and -mapper to give them
- defaults.<br />(Owen O'Malley via tomwhite)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.12.1_-_2007-03-17_')">Release 0.12.1 - 2007-03-17
- </a></h3>
- <ol id="release_0.12.1_-_2007-03-17_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1035">HADOOP-1035</a>. Fix a StackOverflowError in FSDataSet.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1053">HADOOP-1053</a>. Fix VInt representation of negative values. Also
- remove references in generated record code to methods outside of
- the record package and improve some record documentation.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1067">HADOOP-1067</a>. Compile fails if Checkstyle jar is present in lib
- directory. Also remove dependency on a particular Checkstyle
- version number.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1060">HADOOP-1060</a>. Fix an IndexOutOfBoundsException in the JobTracker
- that could cause jobs to hang.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1077">HADOOP-1077</a>. Fix a race condition fetching map outputs that could
- hang reduces.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1083">HADOOP-1083</a>. Fix so that when a cluster restarts with a missing
- datanode, its blocks are replicated.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1082">HADOOP-1082</a>. Fix a NullPointerException in ChecksumFileSystem.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1088">HADOOP-1088</a>. Fix record serialization of negative values.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1080">HADOOP-1080</a>. Fix bug in bin/hadoop on Windows when native
- libraries are present.<br />(ab via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1091">HADOOP-1091</a>. Fix a NullPointerException in MetricsRecord.<br />(David Bowen via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1092">HADOOP-1092</a>. Fix a NullPointerException in HeartbeatMonitor
- thread.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1112">HADOOP-1112</a>. Fix a race condition in Hadoop metrics.<br />(David Bowen via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1108">HADOOP-1108</a>. Checksummed file system should retry reading if a
- different replica is found when handling ChecksumException.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1070">HADOOP-1070</a>. Fix a problem with number of racks and datanodes
- temporarily doubling.<br />(Konstantin Shvachko via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1099">HADOOP-1099</a>. Fix NullPointerException in JobInProgress.<br />(Gautam Kowshik via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1115">HADOOP-1115</a>. Fix bug where FsShell copyToLocal doesn't
- copy directories.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1109">HADOOP-1109</a>. Fix NullPointerException in StreamInputFormat.<br />(Koji Noguchi via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1117">HADOOP-1117</a>. Fix DFS scalability: when the namenode is
- restarted it consumes 80% CPU.<br />(Dhruba Borthakur via
- tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1089">HADOOP-1089</a>. Make the C++ version of write and read v-int
- agree with the Java versions.<br />(Milind Bhandarkar via
- tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1096">HADOOP-1096</a>. Rename InputArchive and OutputArchive and
- make them public.<br />(Milind Bhandarkar via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1128">HADOOP-1128</a>. Fix missing progress information in map tasks.<br />(Espen Amble Kolstad, Andrzej Bialecki, and Owen O'Malley
- via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1129">HADOOP-1129</a>. Fix DFSClient to not hide IOExceptions in
- flush method.<br />(Hairong Kuang via tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1126">HADOOP-1126</a>. Optimize CPU usage for under replicated blocks
- when cluster restarts.<br />(Hairong Kuang via tomwhite)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.12.0_-_2007-03-02_')">Release 0.12.0 - 2007-03-02
- </a></h3>
- <ol id="release_0.12.0_-_2007-03-02_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-975">HADOOP-975</a>. Separate stdout and stderr from tasks.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-982">HADOOP-982</a>. Add some setters and a toString() method to
- BytesWritable.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-858">HADOOP-858</a>. Move contrib/smallJobsBenchmark to src/test, removing
- obsolete bits.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-992">HADOOP-992</a>. Fix MiniMR unit tests to use MiniDFS when specified,
- rather than the local FS.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-954">HADOOP-954</a>. Change use of metrics to use callback mechanism.
- Also rename utility class Metrics to MetricsUtil.<br />(David Bowen &amp; Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-893">HADOOP-893</a>. Improve HDFS client's handling of dead datanodes.
- The set is no longer reset with each block, but rather is now
- maintained for the life of an open file.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-882">HADOOP-882</a>. Upgrade to jets3t version 0.5, used by the S3
- FileSystem. This version supports retries.<br />(Michael Stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-977">HADOOP-977</a>. Send task's stdout and stderr to JobClient's stdout
- and stderr respectively, with each line tagged by the task's name.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-761">HADOOP-761</a>. Change unit tests to not use /tmp.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1007">HADOOP-1007</a>. Make names of metrics used in Hadoop unique.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-491">HADOOP-491</a>. Change mapred.task.timeout to be per-job, and make a
- value of zero mean no timeout. Also change contrib/streaming to
- disable task timeouts.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1010">HADOOP-1010</a>. Add Reporter.NULL, a Reporter implementation that
- does nothing.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-923">HADOOP-923</a>. In HDFS NameNode, move replication computation to a
- separate thread, to improve heartbeat processing time.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-476">HADOOP-476</a>. Rewrite contrib/streaming command-line processing,
- improving parameter validation.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-973">HADOOP-973</a>. Improve error messages in Namenode. This should help
- to track down a problem that was appearing as a
- NullPointerException.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-649">HADOOP-649</a>. Fix so that jobs with no tasks are not lost.<br />(Thomas Friol via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-803">HADOOP-803</a>. Reduce memory use by HDFS namenode, phase I.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1021">HADOOP-1021</a>. Fix MRCaching-based unit tests on Windows.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-889">HADOOP-889</a>. Remove duplicate code from HDFS unit tests.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-943">HADOOP-943</a>. Improve HDFS's fsck command to display the filename
- for under-replicated blocks.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-333">HADOOP-333</a>. Add validator for sort benchmark output.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-947">HADOOP-947</a>. Improve performance of datanode decommissioning.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-442">HADOOP-442</a>. Permit one to specify hosts allowed to connect to
- namenode and jobtracker with include and exclude files.<br />(Wendy
- Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1017">HADOOP-1017</a>. Cache constructors, for improved performance.<br />(Ron Bodkin via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-867">HADOOP-867</a>. Move split creation out of JobTracker to client.
- Splits are now saved in a separate file, read by task processes
- directly, so that user code is no longer required in the
- JobTracker.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1006">HADOOP-1006</a>. Remove obsolete '-local' option from test code.<br />(Gautam Kowshik via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-952">HADOOP-952</a>. Create a public (shared) Hadoop EC2 AMI.
- The EC2 scripts now support launch of public AMIs.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1025">HADOOP-1025</a>. Remove some obsolete code in ipc.Server.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-997">HADOOP-997</a>. Implement S3 retry mechanism for failed block
- transfers. This includes a generic retry mechanism for use
- elsewhere in Hadoop.<br />(tomwhite)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-990">HADOOP-990</a>. Improve HDFS support for full datanode volumes.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-564">HADOOP-564</a>. Replace uses of "dfs://" URIs with the more standard
- "hdfs://".<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1030">HADOOP-1030</a>. In unit tests, unify setting of ipc.client.timeout.
- Also increase the value used from one to two seconds, in hopes of
- making tests complete more reliably.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-654">HADOOP-654</a>. Stop assigning tasks to a tasktracker if it has
- failed more than a specified number in the job.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-985">HADOOP-985</a>. Change HDFS to identify nodes by IP address rather
- than by DNS hostname.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-248">HADOOP-248</a>. Optimize location of map outputs to not use random
- probes.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1029">HADOOP-1029</a>. Fix streaming's input format to correctly seek to
- the start of splits.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-492">HADOOP-492</a>. Add per-job and per-task counters. These are
- incremented via the Reporter interface and available through the
- web ui and the JobClient API. The mapreduce framework maintains a
- few basic counters, and applications may add their own. Counters
- are also passed to the metrics system.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1034">HADOOP-1034</a>. Fix datanode to better log exceptions.<br />(Philippe Gassmann via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-878">HADOOP-878</a>. In contrib/streaming, fix reducer=NONE to work with
- multiple maps.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1039">HADOOP-1039</a>. In HDFS's TestCheckpoint, avoid restarting
- MiniDFSCluster so often, speeding this test.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1040">HADOOP-1040</a>. Update RandomWriter example to use counters and
- user-defined input and output formats.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1027">HADOOP-1027</a>. Fix problems with in-memory merging during shuffle
- and re-enable this optimization.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1036">HADOOP-1036</a>. Fix exception handling in TaskTracker to keep tasks
- from being lost.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1042">HADOOP-1042</a>. Improve the handling of failed map output fetches.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-928">HADOOP-928</a>. Make checksums optional per FileSystem.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1044">HADOOP-1044</a>. Fix HDFS's TestDecommission to not spuriously fail.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-972">HADOOP-972</a>. Optimize HDFS's rack-aware block placement algorithm.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1043">HADOOP-1043</a>. Optimize shuffle, increasing parallelism.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-940">HADOOP-940</a>. Improve HDFS's replication scheduling.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1020">HADOOP-1020</a>. Fix a bug in Path resolution, and a problem with unit tests
- on Windows.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-941">HADOOP-941</a>. Enhance record facility.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1000">HADOOP-1000</a>. Fix so that log messages in task subprocesses are
- not written to a task's standard error.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1037">HADOOP-1037</a>. Fix bin/slaves.sh, which currently only works with
- /bin/bash, to specify /bin/bash rather than /bin/sh.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1046">HADOOP-1046</a>. Clean up tmp from partially received stale block files.<br />(ab)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1041">HADOOP-1041</a>. Optimize mapred counter implementation. Also group
- counters by their declaring Enum.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1032">HADOOP-1032</a>. Permit one to specify jars that will be cached
- across multiple jobs.<br />(Gautam Kowshik via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1051">HADOOP-1051</a>. Add optional checkstyle task to build.xml. To use
- this developers must download the (LGPL'd) checkstyle jar
- themselves.<br />(tomwhite via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1049">HADOOP-1049</a>. Fix a race condition in IPC client.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1056">HADOOP-1056</a>. Check HDFS include/exclude node lists with both IP
- address and hostname.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-994">HADOOP-994</a>. In HDFS, limit the number of blocks invalidated at
- once. Large lists were causing datanodes to time out.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-432">HADOOP-432</a>. Add a trash feature, disabled by default. When
- enabled, the FSShell 'rm' command will move things to a trash
- directory in the filesystem. In HDFS, a thread periodically
- checkpoints the trash and removes old checkpoints.<br />(cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.11.2_-_2007-02-16_')">Release 0.11.2 - 2007-02-16
- </a></h3>
- <ol id="release_0.11.2_-_2007-02-16_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1009">HADOOP-1009</a>. Fix an infinite loop in the HDFS namenode.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-1014">HADOOP-1014</a>. Disable in-memory merging during shuffle, as this is
- causing data corruption.<br />(Devaraj Das via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.11.1_-_2007-02-09_')">Release 0.11.1 - 2007-02-09
- </a></h3>
- <ol id="release_0.11.1_-_2007-02-09_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-976">HADOOP-976</a>. Make SequenceFile.Metadata public.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-917">HADOOP-917</a>. Fix a NullPointerException in SequenceFile's merger
- with large map outputs.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-984">HADOOP-984</a>. Fix a bug in shuffle error handling introduced by
- <a href="http://issues.apache.org/jira/browse/HADOOP-331">HADOOP-331</a>. If a map output is unavailable, the job tracker is
- once more informed.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-987">HADOOP-987</a>. Fix a problem in HDFS where blocks were not removed
- from neededReplications after a replication target was selected.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.11.0_-_2007-02-02_')">Release 0.11.0 - 2007-02-02
- </a></h3>
- <ol id="release_0.11.0_-_2007-02-02_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-781">HADOOP-781</a>. Remove methods deprecated in 0.10 that are no longer
- widely used.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-842">HADOOP-842</a>. Change HDFS protocol so that the open() method is
- passed the client hostname, to permit the namenode to order block
- locations on the basis of network topology.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-852">HADOOP-852</a>. Add an ant task to compile record definitions, and
- use it to compile record unit tests.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-757">HADOOP-757</a>. Fix "Bad File Descriptor" exception in HDFS client
- when an output file is closed twice.<br />(Raghu Angadi via cutting)</li>
- <li>[ intentionally blank ]
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-890">HADOOP-890</a>. Replace dashes in metric names with underscores,
- for better compatibility with some monitoring systems.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-801">HADOOP-801</a>. Add to jobtracker a log of task completion events.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-855">HADOOP-855</a>. In HDFS, try to repair files with checksum errors.
- An exception is still thrown, but corrupt blocks are now removed
- when they have replicas.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-886">HADOOP-886</a>. Reduce number of timer threads created by metrics API
- by pooling contexts.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-897">HADOOP-897</a>. Add a "javac.args" property to build.xml that permits
- one to pass arbitrary options to javac.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-899">HADOOP-899</a>. Update libhdfs for changes in <a href="http://issues.apache.org/jira/browse/HADOOP-871">HADOOP-871</a>.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-905">HADOOP-905</a>. Remove some dead code from JobClient.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-902">HADOOP-902</a>. Fix a NullPointerException in HDFS client when
- closing output streams.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-735">HADOOP-735</a>. Switch generated record code to use BytesWritable to
- represent fields of type 'buffer'.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-830">HADOOP-830</a>. Improve mapreduce merge performance by buffering and
- merging multiple map outputs as they arrive at reduce nodes before
- they're written to disk.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-908">HADOOP-908</a>. Add a new contrib package, Abacus, that simplifies
- counting and aggregation, built on MapReduce.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-901">HADOOP-901</a>. Add support for recursive renaming to the S3 filesystem.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-912">HADOOP-912</a>. Fix a bug in TaskTracker.isIdle() that was
- sporadically causing unit test failures.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-909">HADOOP-909</a>. Fix the 'du' command to correctly compute the size of
- FileSystem directory trees.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-731">HADOOP-731</a>. When a checksum error is encountered on a file stored
- in HDFS, try another replica of the data, if any.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-732">HADOOP-732</a>. Add support to SequenceFile for arbitrary metadata,
- as a set of attribute value pairs.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-929">HADOOP-929</a>. Fix PhasedFileSystem to pass configuration to
- underlying FileSystem.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-935">HADOOP-935</a>. Fix contrib/abacus to not delete pre-existing output
- files, but rather to fail in this case.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-936">HADOOP-936</a>. More metric renamings, as in <a href="http://issues.apache.org/jira/browse/HADOOP-890">HADOOP-890</a>.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-856">HADOOP-856</a>. Fix HDFS's fsck command to not report that
- non-existent filesystems are healthy.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-602">HADOOP-602</a>. Remove the dependency on Lucene's PriorityQueue
- utility, by copying it into Hadoop. This facilitates using Hadoop
- with different versions of Lucene without worrying about CLASSPATH
- order.<br />(Milind Bhandarkar via cutting)</li>
- <li>[ intentionally blank ]
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-227">HADOOP-227</a>. Add support for backup namenodes, which periodically
- get snapshots of the namenode state.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-884">HADOOP-884</a>. Add scripts in contrib/ec2 to facilitate running
- Hadoop on an Amazon EC2 cluster.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-937">HADOOP-937</a>. Change the namenode to request re-registration of
- datanodes in more circumstances.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-922">HADOOP-922</a>. Optimize small forward seeks in HDFS. If data is
- likely already in flight, skip ahead rather than re-opening the
- block.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-961">HADOOP-961</a>. Add a 'job -events' sub-command that prints job
- events, including task completions and failures.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-959">HADOOP-959</a>. Fix namenode snapshot code added in <a href="http://issues.apache.org/jira/browse/HADOOP-227">HADOOP-227</a> to
- work on Windows.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-934">HADOOP-934</a>. Fix TaskTracker to catch metrics exceptions that were
- causing heartbeats to fail.<br />(Arun Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-881">HADOOP-881</a>. Fix JobTracker web interface to display the correct
- number of task failures.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-788">HADOOP-788</a>. Change contrib/streaming to subclass TextInputFormat,
- permitting it to take advantage of native compression facilities.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-962">HADOOP-962</a>. In contrib/ec2: make scripts executable in tar file;
- add a README; make the environment file use a template.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-549">HADOOP-549</a>. Fix a NullPointerException in TaskReport's
- serialization.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-963">HADOOP-963</a>. Fix remote exceptions to have the stack trace of the
- caller thread, not the IPC listener thread.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-967">HADOOP-967</a>. Change RPC clients to start sending a version header.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-964">HADOOP-964</a>. Fix a bug introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-830">HADOOP-830</a> where jobs failed
- whose comparators and/or i/o types were in the job's jar.<br />(Dennis Kubes via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-969">HADOOP-969</a>. Fix a deadlock in JobTracker.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-862">HADOOP-862</a>. Add support for the S3 FileSystem to the CopyFiles
- tool.<br />(Michael Stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-965">HADOOP-965</a>. Fix IsolationRunner so that job's jar can be found.<br />(Dennis Kubes via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-309">HADOOP-309</a>. Fix two NullPointerExceptions in StatusHttpServer.<br />(navychen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-692">HADOOP-692</a>. Add rack awareness to HDFS's placement of blocks.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.10.1_-_2007-01-10_')">Release 0.10.1 - 2007-01-10
- </a></h3>
- <ol id="release_0.10.1_-_2007-01-10_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-857">HADOOP-857</a>. Fix S3 FileSystem implementation to permit its use
- for MapReduce input and output.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-863">HADOOP-863</a>. Reduce logging verbosity introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-813">HADOOP-813</a>.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-815">HADOOP-815</a>. Fix memory leaks in JobTracker.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-600">HADOOP-600</a>. Fix a race condition in JobTracker.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-864">HADOOP-864</a>. Fix 'bin/hadoop -jar' to operate correctly when
- hadoop.tmp.dir does not yet exist.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-866">HADOOP-866</a>. Fix 'dfs -get' command to remove existing crc files,
- if any.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-871">HADOOP-871</a>. Fix a bug in bin/hadoop setting JAVA_LIBRARY_PATH.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-868">HADOOP-868</a>. Decrease the number of open files during map,
- respecting io.sort.factor.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-865">HADOOP-865</a>. Fix S3 FileSystem so that partially created files can
- be deleted.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-873">HADOOP-873</a>. Pass java.library.path correctly to child processes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-851">HADOOP-851</a>. Add support for the LZO codec. This is much faster
- than the default, zlib-based compression, but it is only available
- when the native library is built.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-880">HADOOP-880</a>. Fix S3 FileSystem to remove directories.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-879">HADOOP-879</a>. Fix InputFormatBase to handle output generated by
- MapFileOutputFormat.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-659">HADOOP-659</a>. In HDFS, prioritize replication of blocks based on
- current replication level. Blocks which are severely
- under-replicated should be further replicated before blocks which
- are less under-replicated.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-726">HADOOP-726</a>. Deprecate FileSystem locking methods. They are not
- currently usable. Locking should eventually be provided as an
- independent service.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-758">HADOOP-758</a>. Fix exception handling during reduce so that root
- exceptions are not masked by exceptions in cleanups.<br />(Raghu Angadi via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.10.0_-_2007-01-05_')">Release 0.10.0 - 2007-01-05
- </a></h3>
- <ol id="release_0.10.0_-_2007-01-05_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-763">HADOOP-763</a>. Change DFS namenode benchmark to not use MapReduce.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-777">HADOOP-777</a>. Use fully-qualified hostnames for tasktrackers and
- datanodes.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-621">HADOOP-621</a>. Change 'dfs -cat' to exit sooner when output has been
- closed.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-752">HADOOP-752</a>. Rationalize some synchronization in DFS namenode.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-629">HADOOP-629</a>. Fix RPC services to better check the protocol name and
- version.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-774">HADOOP-774</a>. Limit the number of invalid blocks returned with
- heartbeats by the namenode to datanodes. Transmitting and
- processing very large invalid block lists can tie up both the
- namenode and datanode for too long.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-738">HADOOP-738</a>. Change 'dfs -get' command to not create CRC files by
- default, adding a -crc option to force their creation.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-676">HADOOP-676</a>. Improved exceptions and error messages for common job
- input specification errors.<br />(Sanjay Dahiya via cutting)</li>
- <li>[Included in 0.9.2 release]
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-756">HADOOP-756</a>. Add new dfsadmin option to wait for filesystem to be
- operational.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-770">HADOOP-770</a>. Fix jobtracker web interface to display, on restart,
- jobs that were running when it was last stopped.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-331">HADOOP-331</a>. Write all map outputs to a single file with an index,
- rather than to a separate file per reduce task. This should both
- speed the shuffle and make things more scalable.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-818">HADOOP-818</a>. Fix contrib unit tests to not depend on core unit
- tests.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-786">HADOOP-786</a>. Log common exception at debug level.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-796">HADOOP-796</a>. Provide more convenient access to failed task
- information in the web interface.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-764">HADOOP-764</a>. Reduce memory allocations in namenode some.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-802">HADOOP-802</a>. Update description of mapred.speculative.execution to
- mention reduces.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-806">HADOOP-806</a>. Include link to datanodes on front page of namenode
- web interface.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-618">HADOOP-618</a>. Make JobSubmissionProtocol public.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-782">HADOOP-782</a>. Fully remove killed tasks.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-792">HADOOP-792</a>. Fix 'dfs -mv' to return correct status.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-673">HADOOP-673</a>. Give each task its own working directory again.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-571">HADOOP-571</a>. Extend the syntax of Path to be a URI; to be
- optionally qualified with a scheme and authority. The scheme
- determines the FileSystem implementation, while the authority
- determines the FileSystem instance. New FileSystem
- implementations may be provided by defining an fs.&lt;scheme&gt;.impl
- property, naming the FileSystem implementation class. This
- permits easy integration of new FileSystem implementations.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-720">HADOOP-720</a>. Add an HDFS white paper to website.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-794">HADOOP-794</a>. Fix a divide-by-zero exception when a job specifies
- zero map tasks.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-454">HADOOP-454</a>. Add a 'dfs -dus' command that provides summary disk
- usage.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-574">HADOOP-574</a>. Add an Amazon S3 implementation of FileSystem. To
- use this, one need only specify paths of the form
- s3://id:secret@bucket/. Alternately, the AWS access key id and
- secret can be specified in your config, with the properties
- fs.s3.awsAccessKeyId and fs.s3.awsSecretAccessKey.<br />(Tom White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-824">HADOOP-824</a>. Rename DFSShell to be FsShell, since it applies
- generically to all FileSystem implementations.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-813">HADOOP-813</a>. Fix map output sorting to report progress, so that
- sorts which take longer than the task timeout do not fail.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-825">HADOOP-825</a>. Fix HDFS daemons when configured with new URI syntax.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-596">HADOOP-596</a>. Fix a bug in phase reporting during reduce.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-811">HADOOP-811</a>. Add a utility, MultithreadedMapRunner.<br />(Alejandro Abdelnur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-829">HADOOP-829</a>. Within HDFS, clearly separate three different
- representations for datanodes: one for RPCs, one for
- namenode-internal use, and one for namespace persistence.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-823">HADOOP-823</a>. Fix problem starting datanode when not all configured
- data directories exist.<br />(Bryan Pendleton via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-451">HADOOP-451</a>. Add a Split interface. CAUTION: This incompatibly
- changes the InputFormat and RecordReader interfaces. Not only is
- FileSplit replaced with Split, but a FileSystem parameter is no
- longer passed in several methods, input validation has changed,
- etc.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-814">HADOOP-814</a>. Optimize locking in namenode.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-738">HADOOP-738</a>. Change 'fs -put' and 'fs -get' commands to accept
- standard input and output, respectively. Standard i/o is
- specified by a file named '-'.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-835">HADOOP-835</a>. Fix a NullPointerException reading record-compressed
- SequenceFiles.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-836">HADOOP-836</a>. Fix a MapReduce bug on Windows, where the wrong
- FileSystem was used. Also add a static FileSystem.getLocal()
- method and better Path checking in HDFS, to help avoid such issues
- in the future.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-837">HADOOP-837</a>. Improve RunJar utility to unpack jar file into
- hadoop.tmp.dir, rather than the system temporary directory.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-841">HADOOP-841</a>. Fix native library to build 32-bit version even when
- on a 64-bit host, if a 32-bit JVM is used.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-838">HADOOP-838</a>. Fix tasktracker to pass java.library.path to
- sub-processes, so that libhadoop.a is found.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-844">HADOOP-844</a>. Send metrics messages on a fixed-delay schedule
- instead of a fixed-rate schedule.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-849">HADOOP-849</a>. Fix OutOfMemory exceptions in TaskTracker due to a
- file handle leak in SequenceFile.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-745">HADOOP-745</a>. Fix a synchronization bug in the HDFS namenode.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-850">HADOOP-850</a>. Add Writable implementations for variable-length
- integers.<br />(ab via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-525">HADOOP-525</a>. Add raw comparators to record types. This greatly
- improves record sort performance.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-628">HADOOP-628</a>. Fix a problem with 'fs -cat' command, where some
- characters were replaced with question marks.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-804">HADOOP-804</a>. Reduce verbosity of MapReduce logging.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-853">HADOOP-853</a>. Rename 'site' to 'docs', in preparation for inclusion
- in releases.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-371">HADOOP-371</a>. Include contrib jars and site documentation in
- distributions. Also add contrib and example documentation to
- distributed javadoc, in separate sections.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-846">HADOOP-846</a>. Report progress during entire map, as sorting of
- intermediate outputs may happen at any time, potentially causing
- task timeouts.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-840">HADOOP-840</a>. In task tracker, queue task cleanups and perform them
- in a separate thread.<br />(omalley &amp; Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-681">HADOOP-681</a>. Add to HDFS the ability to decommission nodes. This
- causes their blocks to be re-replicated on other nodes, so that
- they may be removed from a cluster.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-470">HADOOP-470</a>. In HDFS web ui, list the datanodes containing each
- copy of a block.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-700">HADOOP-700</a>. Change bin/hadoop to only include core jar file on
- classpath, not example, test, etc. Also rename core jar to
- hadoop-${version}-core.jar so that it can be more easily
- identified.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-619">HADOOP-619</a>. Extend InputFormatBase to accept individual files and
- glob patterns as MapReduce inputs, not just directories. Also
- change contrib/streaming to use this.<br />(Sanjay Dahiya via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.9.2_-_2006-12-15_')">Release 0.9.2 - 2006-12-15
- </a></h3>
- <ol id="release_0.9.2_-_2006-12-15_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-639">HADOOP-639</a>. Restructure InterTrackerProtocol to make task
- accounting more reliable.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-827">HADOOP-827</a>. Turn off speculative execution by default, since it's
- currently broken.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-791">HADOOP-791</a>. Fix a deadlock in the task tracker.<br />(Mahadev Konar via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.9.1_-_2006-12-06_')">Release 0.9.1 - 2006-12-06
- </a></h3>
- <ol id="release_0.9.1_-_2006-12-06_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-780">HADOOP-780</a>. Use ReflectionUtils to instantiate key and value
- objects.<br />(ab)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-779">HADOOP-779</a>. Fix contrib/streaming to work correctly with gzipped
- input files.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.9.0_-_2006-12-01_')">Release 0.9.0 - 2006-12-01
- </a></h3>
- <ol id="release_0.9.0_-_2006-12-01_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-655">HADOOP-655</a>. Remove most deprecated code. A few deprecated things
- remain, notably UTF8 and some methods that are still required.
- Also cleaned up constructors for SequenceFile, MapFile, SetFile,
- and ArrayFile a bit.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-565">HADOOP-565</a>. Upgrade to Jetty version 6.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-682">HADOOP-682</a>. Fix DFS format command to work correctly when
- configured with a non-existent directory.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-645">HADOOP-645</a>. Fix a bug in contrib/streaming when -reducer is NONE.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-687">HADOOP-687</a>. Fix a classpath bug in bin/hadoop that blocked the
- servers from starting.<br />(Sameer Paranjpye via omalley)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-683">HADOOP-683</a>. Remove a script dependency on bash, so it works with
- dash, the new default for /bin/sh on Ubuntu.<br />(James Todd via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-382">HADOOP-382</a>. Extend unit tests to run multiple datanodes.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-604">HADOOP-604</a>. Fix some synchronization issues and a
- NullPointerException in DFS datanode.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-459">HADOOP-459</a>. Fix memory leaks and a host of other issues with
- libhdfs.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-694">HADOOP-694</a>. Fix a NullPointerException in jobtracker.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-637">HADOOP-637</a>. Fix a memory leak in the IPC server. Direct buffers
- are not collected like normal buffers, and provided little
- advantage.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-696">HADOOP-696</a>. Fix TestTextInputFormat unit test to not rely on the
- order of directory listings.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-611">HADOOP-611</a>. Add support for iterator-based merging to
- SequenceFile.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-688">HADOOP-688</a>. Move DFS administrative commands to a separate
- command named 'dfsadmin'.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-708">HADOOP-708</a>. Fix test-libhdfs to return the correct status, so
- that failures will break the build.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-646">HADOOP-646</a>. Fix namenode to handle edits files larger than 2GB.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-705">HADOOP-705</a>. Fix a bug in the JobTracker when failed jobs were
- not completely cleaned up.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-613">HADOOP-613</a>. Perform final merge while reducing. This removes one
- sort pass over the data and should consequently significantly
- decrease overall processing time.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-661">HADOOP-661</a>. Make each job's configuration visible through the web
- ui.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-489">HADOOP-489</a>. In MapReduce, separate user logs from system logs.
- Each task's log output is now available through the web ui.<br />(Arun
- C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-712">HADOOP-712</a>. Fix record io's xml serialization to correctly handle
- control-characters.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-668">HADOOP-668</a>. Improvements to the web-based DFS browser.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-715">HADOOP-715</a>. Fix build.xml so that test logs are written in build
- directory, rather than in CWD.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-538">HADOOP-538</a>. Add support for building an optional native library,
- libhadoop.so, that improves the performance of zlib-based
- compression. To build this, specify -Dcompile.native to Ant.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-610">HADOOP-610</a>. Fix a problem when the DFS block size is configured
- to be smaller than the buffer size, typically only when debugging.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-695">HADOOP-695</a>. Fix a NullPointerException in contrib/streaming.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-652">HADOOP-652</a>. In DFS, when a file is deleted, the block count is
- now decremented.<br />(Vladimir Krokhmalyov via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-725">HADOOP-725</a>. In DFS, optimize block placement algorithm,
- previously a performance bottleneck.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-723">HADOOP-723</a>. In MapReduce, fix a race condition during the
- shuffle, which resulted in FileNotFoundExceptions.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-447">HADOOP-447</a>. In DFS, fix getBlockSize(Path) to work with relative
- paths.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-733">HADOOP-733</a>. Make exit codes in DFSShell consistent and add a unit
- test.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-709">HADOOP-709</a>. Fix contrib/streaming to work with commands that
- contain control characters.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-677">HADOOP-677</a>. In IPC, permit a version header to be transmitted
- when connections are established. This will permit us to change
- the format of IPC requests back-compatibly in subsequent releases.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-699">HADOOP-699</a>. Fix DFS web interface so that filesystem browsing
- works correctly, using the right port number. Also add support
- for sorting datanode list by various columns.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-76">HADOOP-76</a>. Implement speculative reduce. Now when a job is
- configured for speculative execution, both maps and reduces will
- execute speculatively. Reduce outputs are written to a temporary
- location and moved to the final location when reduce is complete.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-736">HADOOP-736</a>. Roll back to Jetty 5.1.4, due to performance problems
- with Jetty 6.0.1.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-739">HADOOP-739</a>. Fix TestIPC to use different port number, making it
- more reliable.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-749">HADOOP-749</a>. Fix a NullPointerException in jobfailures.jsp.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-747">HADOOP-747</a>. Fix record serialization to work correctly when
- records are embedded in Maps.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-698">HADOOP-698</a>. Fix HDFS client not to retry the same datanode on
- read failures.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-689">HADOOP-689</a>. Add GenericWritable, to facilitate polymorphism in
- MapReduce, SequenceFile, etc.<br />(Feng Jiang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-430">HADOOP-430</a>. Stop datanode's HTTP server when registration with
- namenode fails.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-750">HADOOP-750</a>. Fix a potential race condition during mapreduce
- shuffle.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-728">HADOOP-728</a>. Fix contrib/streaming-related issues, including
- '-reducer NONE'.<br />(Sanjay Dahiya via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.8.0_-_2006-11-03_')">Release 0.8.0 - 2006-11-03
- </a></h3>
- <ol id="release_0.8.0_-_2006-11-03_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-477">HADOOP-477</a>. Extend contrib/streaming to scan the PATH environment
- variable when resolving executable program names.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-583">HADOOP-583</a>. In DFSClient, reduce the log level of re-connect
- attempts from 'info' to 'debug', so they are not normally shown.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-498">HADOOP-498</a>. Re-implement DFS integrity checker to run server-side,
- for much improved performance.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-586">HADOOP-586</a>. Use the jar name for otherwise un-named jobs.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-514">HADOOP-514</a>. Make DFS heartbeat interval configurable.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-588">HADOOP-588</a>. Fix logging and accounting of failed tasks.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-462">HADOOP-462</a>. Improve command line parsing in DFSShell, so that
- incorrect numbers of arguments result in informative errors rather
- than ArrayIndexOutOfBoundsException.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-561">HADOOP-561</a>. Fix DFS so that one replica of each block is written
- locally, if possible. This was the intent, but there was a bug.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-610">HADOOP-610</a>. Fix TaskTracker to survive more exceptions, keeping
- tasks from becoming lost.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-625">HADOOP-625</a>. Add a servlet to all http daemons that displays a
- stack dump, useful for debugging.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-554">HADOOP-554</a>. Fix DFSShell to return -1 for errors.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-626">HADOOP-626</a>. Correct the documentation in the NNBench example
- code, and also remove a mistaken call there.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-634">HADOOP-634</a>. Add missing license to many files.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-627">HADOOP-627</a>. Fix some synchronization problems in MiniMRCluster
- that sometimes caused unit tests to fail.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-563">HADOOP-563</a>. Improve the NameNode's lease policy so that leases
- are held for one hour without renewal (instead of one minute).
- However another attempt to create the same file will still succeed
- if the lease has not been renewed within a minute. This prevents
- communication or scheduling problems from causing a write to fail
- for up to an hour, barring some other process trying to create the
- same file.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-635">HADOOP-635</a>. In DFSShell, permit specification of multiple files
- as the source for file copy and move commands.<br />(Dhruba Borthakur via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-641">HADOOP-641</a>. Change NameNode to request a fresh block report from
- a re-discovered DataNode, so that no-longer-needed replications
- are stopped promptly.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-642">HADOOP-642</a>. Change IPC client to specify an explicit connect
- timeout.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-638">HADOOP-638</a>. Fix an unsynchronized access to TaskTracker's
- internal state.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-624">HADOOP-624</a>. Fix servlet path to stop a Jetty warning on startup.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-578">HADOOP-578</a>. Failed tasks are no longer placed at the end of the
- task queue. This was originally done to work around other
- problems that have now been fixed. Re-executing failed tasks
- sooner causes buggy jobs to fail faster.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-658">HADOOP-658</a>. Update source file headers per Apache policy.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-636">HADOOP-636</a>. Add MapFile &amp; ArrayFile constructors which accept a
- Progressable, and pass it down to SequenceFile. This permits
- reduce tasks which use MapFile to still report progress while
- writing blocks to the filesystem.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-576">HADOOP-576</a>. Enable contrib/streaming to use the file cache. Also
- extend the cache to permit symbolic links to cached items, rather
- than local file copies.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-482">HADOOP-482</a>. Fix unit tests to work when a cluster is running on
- the same machine, removing port conflicts.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-90">HADOOP-90</a>. Permit dfs.name.dir to list multiple directories,
- where namenode data is to be replicated.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-651">HADOOP-651</a>. Fix DFSCk to correctly pass parameters to the servlet
- on the namenode.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-553">HADOOP-553</a>. Change main() routines of DataNode and NameNode to
- log exceptions rather than letting the JVM print them to standard
- error. Also, change the hadoop-daemon.sh script to rotate
- standard i/o log files.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-399">HADOOP-399</a>. Fix javadoc warnings.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-599">HADOOP-599</a>. Fix web ui and command line to correctly report DFS
- filesystem size statistics. Also improve web layout.<br />(Raghu Angadi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-660">HADOOP-660</a>. Permit specification of junit test output format.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-663">HADOOP-663</a>. Fix a few unit test issues.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-664">HADOOP-664</a>. Cause entire build to fail if libhdfs tests fail.<br />(Nigel Daley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-633">HADOOP-633</a>. Keep jobtracker from dying when job initialization
- throws exceptions. Also improve exception handling in a few other
- places and add more informative thread names.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-669">HADOOP-669</a>. Fix a problem introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-90">HADOOP-90</a> that can cause
- DFS to lose files.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-373">HADOOP-373</a>. Consistently check the value returned by
- FileSystem.mkdirs().<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-670">HADOOP-670</a>. Code cleanups in some DFS internals: use generic
- types, replace Vector with ArrayList, etc.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-647">HADOOP-647</a>. Permit map outputs to use a different compression
- type than the job output.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-671">HADOOP-671</a>. Fix file cache to check for pre-existence before
- creating.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-665">HADOOP-665</a>. Extend many DFSShell commands to accept multiple
- arguments. Now commands like "ls", "rm", etc. will operate on
- multiple files.<br />(Dhruba Borthakur via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.7.2_-_2006-10-18_')">Release 0.7.2 - 2006-10-18
- </a></h3>
- <ol id="release_0.7.2_-_2006-10-18_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-607">HADOOP-607</a>. Fix a bug where classes included in job jars were not
- found by tasks.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-609">HADOOP-609</a>. Add a unit test that checks that classes in job jars
- can be found by tasks. Also modify unit tests to specify multiple
- local directories.<br />(Mahadev Konar via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.7.1_-_2006-10-11_')">Release 0.7.1 - 2006-10-11
- </a></h3>
- <ol id="release_0.7.1_-_2006-10-11_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-593">HADOOP-593</a>. Fix a NullPointerException in the JobTracker.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-592">HADOOP-592</a>. Fix a NullPointerException in the IPC Server. Also
- consistently log when stale calls are discarded.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-594">HADOOP-594</a>. Increase the DFS safe-mode threshold from .95 to
- .999, so that nearly all blocks must be reported before filesystem
- modifications are permitted.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-598">HADOOP-598</a>. Fix tasks to retry when reporting completion, so that
- a single RPC timeout won't fail a task.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-597">HADOOP-597</a>. Fix TaskTracker to not discard map outputs for errors
- in transmitting them to reduce nodes.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.7.0_-_2006-10-06_')">Release 0.7.0 - 2006-10-06
- </a></h3>
- <ol id="release_0.7.0_-_2006-10-06_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-243">HADOOP-243</a>. Fix rounding in the display of task and job progress
- so that things are not shown to be 100% complete until they are in
- fact finished.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-438">HADOOP-438</a>. Limit the length of absolute paths in DFS, since the
- file format used to store pathnames has some limitations.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-530">HADOOP-530</a>. Improve error messages in SequenceFile when keys or
- values are of the wrong type.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-288">HADOOP-288</a>. Add a file caching system and use it in MapReduce to
- cache job jar files on slave nodes.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-533">HADOOP-533</a>. Fix unit test to not modify conf directory.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-527">HADOOP-527</a>. Permit specification of the local address that various
- Hadoop daemons should bind to.<br />(Philippe Gassmann via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-542">HADOOP-542</a>. Updates to contrib/streaming: reformatted source code,
- on-the-fly merge sort, a fix for <a href="http://issues.apache.org/jira/browse/HADOOP-540">HADOOP-540</a>, etc.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-545">HADOOP-545</a>. Remove an unused config file parameter.<br />(Philippe Gassmann via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-548">HADOOP-548</a>. Add an Ant property "test.output" to build.xml that
- causes test output to be logged to the console.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-261">HADOOP-261</a>. Record an error message when map output is lost.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-293">HADOOP-293</a>. Report the full list of task error messages in the
- web ui, not just the most recent.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-551">HADOOP-551</a>. Restore JobClient's console printouts to only include
- a maximum of one update per one percent of progress.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-306">HADOOP-306</a>. Add a "safe" mode to DFS. The name node enters this
- when less than a specified percentage of file data is complete.
- Currently safe mode is only used on startup, but eventually it
- will also be entered when datanodes disconnect and file data
- becomes incomplete. While in safe mode no filesystem
- modifications are permitted and block replication is inhibited.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-431">HADOOP-431</a>. Change 'dfs -rm' to not operate recursively and add a
- new command, 'dfs -rmr' which operates recursively.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-263">HADOOP-263</a>. Include timestamps for job transitions. The web
- interface now displays the start and end times of tasks and the
- start times of sorting and reducing for reduce tasks. Also,
- extend ObjectWritable to handle enums, so that they can be passed
- as RPC parameters.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-556">HADOOP-556</a>. Contrib/streaming: send keep-alive reports to task
- tracker every 10 seconds rather than every 100 records, to avoid
- task timeouts.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-547">HADOOP-547</a>. Fix reduce tasks to ping tasktracker while copying
- data, rather than only between copies, avoiding task timeouts.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-537">HADOOP-537</a>. Fix src/c++/libhdfs build process to create files in
- build/, no longer modifying the source tree.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-487">HADOOP-487</a>. Throw a more informative exception for unknown RPC
- hosts.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-559">HADOOP-559</a>. Add file name globbing (pattern matching) support to
- the FileSystem API, and use it in DFSShell ('bin/hadoop dfs')
- commands.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-508">HADOOP-508</a>. Fix a bug in FSDataInputStream. Incorrect data was
- returned after seeking to a random location.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-560">HADOOP-560</a>. Add a "killed" task state. This can be used to
- distinguish kills from other failures. Task state has also been
- converted to use an enum type instead of an int, uncovering a bug
- elsewhere. The web interface is also updated to display killed
- tasks.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-423">HADOOP-423</a>. Normalize Paths containing directories named "." and
- "..", using the standard, unix interpretation. Also add checks in
- DFS, prohibiting the use of "." or ".." as directory or file
- names.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-513">HADOOP-513</a>. Replace map output handling with a servlet, rather
- than a JSP page. This fixes an issue where
- IllegalStateExceptions were logged, sets content-length
- correctly, and better handles some errors.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-552">HADOOP-552</a>. Improved error checking when copying map output files
- to reduce nodes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-566">HADOOP-566</a>. Fix scripts to work correctly when accessed through
- relative symbolic links.<br />(Lee Faris via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-519">HADOOP-519</a>. Add positioned read methods to FSInputStream. These
- permit one to read from a stream without moving its position, and
- can hence be performed by multiple threads at once on a single
- stream. Implement an optimized version for DFS and local FS.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-522">HADOOP-522</a>. Permit block compression with MapFile and SetFile.
- Since these formats are always sorted, block compression can
- provide a big advantage.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-567">HADOOP-567</a>. Record version and revision information in builds. A
- package manifest is added to the generated jar file containing
- version information, and a VersionInfo utility is added that
- includes further information, including the build date and user,
- and the subversion revision and repository. A 'bin/hadoop
- version' command is added to show this information, and it is also
- added to various web interfaces.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-568">HADOOP-568</a>. Fix so that errors while initializing tasks on a
- tasktracker correctly report the task as failed to the jobtracker,
- so that it will be rescheduled.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-550">HADOOP-550</a>. Disable automatic UTF-8 validation in Text. This
- permits, e.g., TextInputFormat to again operate on non-UTF-8 data.<br />(Hairong and Mahadev via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-343">HADOOP-343</a>. Fix mapred copying so that a failed tasktracker
- doesn't cause other copies to slow.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-239">HADOOP-239</a>. Add a persistent job history mechanism, so that basic
- job statistics are not lost after 24 hours and/or when the
- jobtracker is restarted.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-506">HADOOP-506</a>. Ignore heartbeats from stale task trackers.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-255">HADOOP-255</a>. Discard stale, queued IPC calls. Do not process
- calls whose clients will likely time out before they receive a
- response. When the queue is full, new calls are now received and
- queued, and the oldest calls are discarded, so that, when servers
- get bogged down, they no longer develop a backlog on the socket.
- This should improve some DFS namenode failure modes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-581">HADOOP-581</a>. Fix datanode to not reset itself on communications
- errors with the namenode. If a request to the namenode fails, the
- datanode should retry, not restart. This reduces the load on the
- namenode, since restarts cause a resend of the block report.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.6.2_-_2006-09-18_')">Release 0.6.2 - 2006-09-18
- </a></h3>
- <ol id="release_0.6.2_-_2006-09-18_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-532">HADOOP-532</a>. Fix a bug reading value-compressed sequence files,
- where an exception was thrown reporting that the full value had not
- been read.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-534">HADOOP-534</a>. Change the default value class in JobConf to be Text
- instead of the now-deprecated UTF8. This fixes the Grep example
- program, which was updated to use Text, but relies on this
- default.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.6.1_-_2006-09-13_')">Release 0.6.1 - 2006-09-13
- </a></h3>
- <ol id="release_0.6.1_-_2006-09-13_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-520">HADOOP-520</a>. Fix a bug in libhdfs, where write failures were not
- correctly returning error codes.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-523">HADOOP-523</a>. Fix a NullPointerException when TextInputFormat is
- explicitly specified. Also add a test case for this.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-521">HADOOP-521</a>. Fix another NullPointerException finding the
- ClassLoader when using libhdfs.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-526">HADOOP-526</a>. Fix a NullPointerException when attempting to start
- two datanodes in the same directory.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-529">HADOOP-529</a>. Fix a NullPointerException when opening
- value-compressed sequence files generated by pre-0.6.0 Hadoop.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.6.0_-_2006-09-08_')">Release 0.6.0 - 2006-09-08
- </a></h3>
- <ol id="release_0.6.0_-_2006-09-08_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-427">HADOOP-427</a>. Replace some uses of DatanodeDescriptor in the DFS
- web UI code with DatanodeInfo, the preferred public class.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-426">HADOOP-426</a>. Fix streaming contrib module to work correctly on
- Solaris. This was causing nightly builds to fail.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-400">HADOOP-400</a>. Improvements to task assignment. Tasks are no longer
- re-run on nodes where they have failed (unless no other node is
- available). Also, tasks are better load-balanced among nodes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-324">HADOOP-324</a>. Fix datanode to not exit when a disk is full, but
- rather simply to fail writes.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-434">HADOOP-434</a>. Change smallJobsBenchmark to use standard Hadoop
- scripts.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-453">HADOOP-453</a>. Fix a bug in Text.setCapacity().<br />(siren via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-450">HADOOP-450</a>. Change so that input types are determined by the
- RecordReader rather than specified directly in the JobConf. This
- facilitates jobs with a variety of input types.
- <p/>
- WARNING: This contains incompatible API changes! The RecordReader
- interface has two new methods that all user-defined InputFormats
- must now define. Also, the values returned by TextInputFormat are
- no longer of class UTF8, but now of class Text.
- </li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-436">HADOOP-436</a>. Fix an error-handling bug in the web ui.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-455">HADOOP-455</a>. Fix a bug in Text, where DEL was not permitted.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-456">HADOOP-456</a>. Change the DFS namenode to keep a persistent record
- of the set of known datanodes. This will be used to implement a
- "safe mode" where filesystem changes are prohibited when a
- critical percentage of the datanodes are unavailable.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-322">HADOOP-322</a>. Add a job control utility. This permits one to
- specify job interdependencies. Each job is submitted only after
- the jobs it depends on have successfully completed.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-176">HADOOP-176</a>. Fix a bug in IntWritable.Comparator.<br />(Dick King via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-421">HADOOP-421</a>. Replace uses of String in recordio package with Text
- class, for improved handling of UTF-8 data.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-464">HADOOP-464</a>. Improved error message when job jar not found.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-469">HADOOP-469</a>. Fix /bin/bash specifics that have crept into our
- /bin/sh scripts since <a href="http://issues.apache.org/jira/browse/HADOOP-352">HADOOP-352</a>.<br />(Jean-Baptiste Quenot via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-468">HADOOP-468</a>. Add HADOOP_NICENESS environment variable to set
- scheduling priority for daemons.<br />(Vetle Roeim via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-473">HADOOP-473</a>. Fix TextInputFormat to correctly handle more EOL
- formats. Things now work correctly with CR, LF or CRLF.<br />(Dennis Kubes &amp; James White via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-461">HADOOP-461</a>. Make Java 1.5 an explicit requirement.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-54">HADOOP-54</a>. Add block compression to SequenceFile. One may now
- specify that blocks of keys and values are compressed together,
- improving compression for small keys and values.
- SequenceFile.Writer's constructor is now deprecated and replaced
- with a factory method.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-281">HADOOP-281</a>. Prohibit DFS files that are also directories.<br />(Wendy Chien via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-486">HADOOP-486</a>. Add the job username to JobStatus instances returned
- by JobClient.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-437">HADOOP-437</a>. contrib/streaming: Add support for gzipped inputs.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-463">HADOOP-463</a>. Add variable expansion to config files.
- Configuration property values may now contain variable
- expressions. A variable is referenced with the syntax
- '${variable}'. Variable values are found first in the
- configuration, and then in Java system properties. The default
- configuration is modified so that temporary directories are now
- under ${hadoop.tmp.dir}, which is, by default,
- /tmp/hadoop-${user.name}.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-419">HADOOP-419</a>. Fix a NullPointerException finding the ClassLoader
- when using libhdfs.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-460">HADOOP-460</a>. Fix contrib/smallJobsBenchmark to use Text instead of
- UTF8.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-196">HADOOP-196</a>. Fix Configuration(Configuration) constructor to work
- correctly.<br />(Sami Siren via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-501">HADOOP-501</a>. Fix Configuration.toString() to handle URL resources.<br />(Thomas Friol via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-499">HADOOP-499</a>. Reduce the use of Strings in contrib/streaming,
- replacing them with Text for better performance.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-64">HADOOP-64</a>. Manage multiple volumes with a single DataNode.
- Previously DataNode would create a separate daemon per configured
- volume, each with its own connection to the NameNode. Now all
- volumes are handled by a single DataNode daemon, reducing the load
- on the NameNode.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-424">HADOOP-424</a>. Fix MapReduce so that jobs which generate zero splits
- do not fail.<br />(Fr&eacute;d&eacute;ric Bertin via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-408">HADOOP-408</a>. Adjust some timeouts and remove some others so that
- unit tests run faster.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-507">HADOOP-507</a>. Fix an IllegalAccessException in DFS.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-320">HADOOP-320</a>. Fix so that checksum files are correctly copied when
- the destination of a file copy is a directory.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-286">HADOOP-286</a>. In DFSClient, avoid pinging the NameNode with
- renewLease() calls when no files are being written.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-312">HADOOP-312</a>. Close idle IPC connections. All IPC connections were
- cached forever. Now, after a connection has been idle for more
- than a configurable amount of time (one second by default), the
- connection is closed, conserving resources on both client and
- server.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-497">HADOOP-497</a>. Permit the specification of the network interface and
- nameserver to be used when determining the local hostname
- advertised by datanodes and tasktrackers.<br />(Lorenzo Thione via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-441">HADOOP-441</a>. Add a compression codec API and extend SequenceFile
- to use it. This will permit the use of alternate compression
- codecs in SequenceFile.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-483">HADOOP-483</a>. Improvements to libhdfs build and documentation.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-458">HADOOP-458</a>. Fix a memory corruption bug in libhdfs.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-517">HADOOP-517</a>. Fix a contrib/streaming bug in end-of-line detection.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-474">HADOOP-474</a>. Add CompressionCodecFactory, and use it in
- TextInputFormat and TextOutputFormat. Compressed input files are
- automatically decompressed when they have the correct extension.
- Output files will, when output compression is specified, be
- generated with an appropriate extension. Also add a gzip codec and
- fix problems with UTF8 text inputs.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.5.0_-_2006-08-04_')">Release 0.5.0 - 2006-08-04
- </a></h3>
- <ol id="release_0.5.0_-_2006-08-04_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-352">HADOOP-352</a>. Fix shell scripts to use /bin/sh instead of
- /bin/bash, for better portability.<br />(Jean-Baptiste Quenot via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-313">HADOOP-313</a>. Permit task state to be saved so that single tasks
- may be manually re-executed when debugging.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-339">HADOOP-339</a>. Add method to JobClient API listing jobs that are
- not yet complete, i.e., that are queued or running.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-355">HADOOP-355</a>. Updates to the streaming contrib module, including
- API fixes, making reduce optional, and adding an input type for
- StreamSequenceRecordReader.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-358">HADOOP-358</a>. Fix an NPE bug in Path.equals().<br />(Fr&eacute;d&eacute;ric Bertin via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-327">HADOOP-327</a>. Fix ToolBase to not call System.exit() when
- exceptions are thrown.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-359">HADOOP-359</a>. Permit map output to be compressed.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-341">HADOOP-341</a>. Permit input URI to CopyFiles to use the HTTP
- protocol. This lets one, e.g., more easily copy log files into
- DFS.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-361">HADOOP-361</a>. Remove unix dependencies from streaming contrib
- module tests, making them pure java.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-354">HADOOP-354</a>. Make public methods to stop DFS daemons.<br />(Barry Kaplan via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-252">HADOOP-252</a>. Add versioning to RPC protocols.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-356">HADOOP-356</a>. Add contrib to "compile" and "test" build targets, so
- that this code is better maintained.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-307">HADOOP-307</a>. Add smallJobsBenchmark contrib module. This runs
- lots of small jobs, in order to determine per-task overheads.<br />(Sanjay Dahiya via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-342">HADOOP-342</a>. Add a tool for log analysis: Logalyzer.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-347">HADOOP-347</a>. Add web-based browsing of DFS content. The namenode
- redirects browsing requests to datanodes. Content requests are
- redirected to datanodes where the data is local when possible.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-351">HADOOP-351</a>. Make Hadoop IPC kernel independent of Jetty.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-237">HADOOP-237</a>. Add metric reporting to DFS and MapReduce. With only
- minor configuration changes, one can now monitor many Hadoop
- system statistics using Ganglia or other monitoring systems.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-376">HADOOP-376</a>. Fix datanode's HTTP server to scan for a free port.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-260">HADOOP-260</a>. Add --config option to shell scripts, specifying an
- alternate configuration directory.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-381">HADOOP-381</a>. Permit developers to save the temporary files for
- tasks whose names match a regular expression, to facilitate
- debugging.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-344">HADOOP-344</a>. Fix some Windows-related problems with DF.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-380">HADOOP-380</a>. Fix reduce tasks to poll less frequently for map
- outputs.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-321">HADOOP-321</a>. Refactor DatanodeInfo, in preparation for
- <a href="http://issues.apache.org/jira/browse/HADOOP-306">HADOOP-306</a>.<br />(Konstantin Shvachko &amp; omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-385">HADOOP-385</a>. Fix some bugs in record io code generation.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-302">HADOOP-302</a>. Add new Text class to replace UTF8, removing
- limitations of that class. Also refactor utility methods for
- writing zero-compressed integers (VInts and VLongs).<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-335">HADOOP-335</a>. Refactor DFS namespace/transaction logging in
- namenode.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-375">HADOOP-375</a>. Fix handling of the datanode HTTP daemon's port so
- that multiple datanodes can be run on a single host.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-386">HADOOP-386</a>. When removing excess DFS block replicas, remove those
- on nodes with the least free space first.<br />(Johan Oskarson via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-389">HADOOP-389</a>. Fix intermittent failures of mapreduce unit tests.
- Also fix some build dependencies.<br />(Mahadev &amp; Konstantin via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-362">HADOOP-362</a>. Fix a problem where jobs hang when status messages
- are received out-of-order.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-394">HADOOP-394</a>. Change order of DFS shutdown in unit tests to
- minimize errors logged.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-396">HADOOP-396</a>. Make DatanodeID implement Writable.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-377">HADOOP-377</a>. Permit one to add URL resources to a Configuration.<br />(Jean-Baptiste Quenot via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-345">HADOOP-345</a>. Permit iteration over Configuration key/value pairs.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-409">HADOOP-409</a>. Streaming contrib module: make configuration
- properties available to commands as environment variables.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-369">HADOOP-369</a>. Add -getmerge option to dfs command that appends all
- files in a directory into a single local file.<br />(Johan Oskarson via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-410">HADOOP-410</a>. Replace some TreeMaps with HashMaps in DFS, for
- a 17% performance improvement.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-411">HADOOP-411</a>. Add unit tests for command line parser.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-412">HADOOP-412</a>. Add MapReduce input formats that support filtering
- of SequenceFile data, including sampling and regex matching.
- Also, move JobConf.newInstance() to a new utility class.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-226">HADOOP-226</a>. Fix fsck command to properly consider replication
- counts, now that these can vary per file.<br />(Bryan Pendleton via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-425">HADOOP-425</a>. Add a Python MapReduce example, using Jython.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.4.0_-_2006-06-28_')">Release 0.4.0 - 2006-06-28
- </a></h3>
- <ol id="release_0.4.0_-_2006-06-28_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-298">HADOOP-298</a>. Improved progress reports for CopyFiles utility, the
- distributed file copier.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-299">HADOOP-299</a>. Fix the task tracker, permitting multiple jobs to
- more easily execute at the same time.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-250">HADOOP-250</a>. Add an HTTP user interface to the namenode, running
- on port 50070.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-123">HADOOP-123</a>. Add MapReduce unit tests that run a jobtracker and
- tasktracker, greatly increasing code coverage.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-271">HADOOP-271</a>. Add links from jobtracker's web ui to tasktracker's
- web ui. Also attempt to log a thread dump of child processes
- before they're killed.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-210">HADOOP-210</a>. Change RPC server to use a selector instead of a
- thread per connection. This should make it easier to scale to
- larger clusters. Note that this incompatibly changes the RPC
- protocol: clients and servers must both be upgraded to the new
- version to ensure correct operation.<br />(Devaraj Das via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-311">HADOOP-311</a>. Change DFS client to retry failed reads, so that a
- single read failure will not alone cause failure of a task.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-314">HADOOP-314</a>. Remove the "append" phase when reducing. Map output
- files are now directly passed to the sorter, without first
- appending them into a single file. Now, the first third of reduce
- progress is "copy" (transferring map output to reduce nodes), the
- middle third is "sort" (sorting map output) and the last third is
- "reduce" (generating output). Long-term, the "sort" phase will
- also be removed.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-316">HADOOP-316</a>. Fix a potential deadlock in the jobtracker.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-319">HADOOP-319</a>. Fix FileSystem.close() to remove the FileSystem
- instance from the cache.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-135">HADOOP-135</a>. Fix potential deadlock in JobTracker by acquiring
- locks in a consistent order.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-278">HADOOP-278</a>. Check for existence of input directories before
- starting MapReduce jobs, making it easier to debug this common
- error.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-304">HADOOP-304</a>. Improve error message for
- UnregisterdDatanodeException to include expected node name.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-305">HADOOP-305</a>. Fix TaskTracker to ask for new tasks as soon as a
- task is finished, rather than waiting for the next heartbeat.
- This improves performance when tasks are short.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-59">HADOOP-59</a>. Add support for generic command line options. One may
- now specify the filesystem (-fs), the MapReduce jobtracker (-jt),
- a config file (-conf) or any configuration property (-D). The
- "dfs", "fsck", "job", and "distcp" commands currently support
- this, with more to be added.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-296">HADOOP-296</a>. Permit specification of the amount of reserved space
- on a DFS datanode. One may specify both the percentage free and
- the number of bytes.<br />(Johan Oskarson via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-325">HADOOP-325</a>. Fix a problem initializing RPC parameter classes, and
- remove the workaround used to initialize classes.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-328">HADOOP-328</a>. Add an option to the "distcp" command to ignore read
- errors while copying.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-27">HADOOP-27</a>. Don't allocate tasks to trackers whose local free
- space is too low.<br />(Johan Oskarson via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-318">HADOOP-318</a>. Keep slow DFS output from causing task timeouts.
- This incompatibly changes some public interfaces, adding a
- parameter to OutputFormat.getRecordWriter() and the new method
- Reporter.progress(), but it makes lots of tasks succeed that were
- previously failing.<br />(Milind Bhandarkar via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.3.2_-_2006-06-09_')">Release 0.3.2 - 2006-06-09
- </a></h3>
- <ol id="release_0.3.2_-_2006-06-09_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-275">HADOOP-275</a>. Update the streaming contrib module to use log4j for
- its logging.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-279">HADOOP-279</a>. Provide defaults for log4j logging parameters, so
- that things still work reasonably when Hadoop-specific system
- properties are not provided.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-280">HADOOP-280</a>. Fix a typo in AllTestDriver which caused the wrong
- test to be run when "DistributedFSCheck" was specified.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-240">HADOOP-240</a>. DFS's mkdirs() implementation no longer logs a warning
- when the directory already exists.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-285">HADOOP-285</a>. Fix DFS datanodes to be able to re-join the cluster
- after the connection to the namenode is lost.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-277">HADOOP-277</a>. Fix a race condition when creating directories.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-289">HADOOP-289</a>. Improved exception handling in DFS datanode.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-292">HADOOP-292</a>. Fix client-side logging to go to standard error
- rather than standard output, so that it can be distinguished from
- application output.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-294">HADOOP-294</a>. Fixed bug where conditions for retrying after errors
- in the DFS client were reversed.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.3.1_-_2006-06-05_')">Release 0.3.1 - 2006-06-05
- </a></h3>
- <ol id="release_0.3.1_-_2006-06-05_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-272">HADOOP-272</a>. Fix a bug in bin/hadoop setting log
- parameters.<br />(omalley &amp; cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-274">HADOOP-274</a>. Change applications to log to standard output rather
- than to a rolling log file like daemons.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-262">HADOOP-262</a>. Fix reduce tasks to report progress while they're
- waiting for map outputs, so that they do not time out.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-245">HADOOP-245</a> and <a href="http://issues.apache.org/jira/browse/HADOOP-246">HADOOP-246</a>. Improvements to record io package.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-276">HADOOP-276</a>. Add logging config files to jar file so that they're
- always found.<br />(omalley via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.3.0_-_2006-06-02_')">Release 0.3.0 - 2006-06-02
- </a></h3>
- <ol id="release_0.3.0_-_2006-06-02_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-208">HADOOP-208</a>. Enhance MapReduce web interface, adding new pages
- for failed tasks, and tasktrackers.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-204">HADOOP-204</a>. Tweaks to metrics package.<br />(David Bowen via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-209">HADOOP-209</a>. Add a MapReduce-based file copier. This will
- copy files within or between file systems in parallel.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-146">HADOOP-146</a>. Fix DFS to check when randomly generating a new block
- id that no existing blocks already have that id.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-180">HADOOP-180</a>. Make a daemon thread that does the actual task clean ups, so
- that the main offerService thread in the taskTracker doesn't get stuck
- and miss its heartbeat window. This was killing many task trackers as
- big jobs finished (300+ tasks / node).<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-200">HADOOP-200</a>. Avoid transmitting entire list of map task names to
- reduce tasks. Instead just transmit the number of map tasks and
- henceforth refer to them by number when collecting map output.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-219">HADOOP-219</a>. Fix a NullPointerException when handling a checksum
- exception under SequenceFile.Sorter.sort().<br />(cutting &amp; stack)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-212">HADOOP-212</a>. Permit alteration of the file block size in DFS. The
- default block size for new files may now be specified in the
- configuration with the dfs.block.size property. The block size
- may also be specified when files are opened.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-218">HADOOP-218</a>. Avoid accessing configuration while looping through
- tasks in JobTracker.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-161">HADOOP-161</a>. Add hashCode() method to DFS's Block.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-115">HADOOP-115</a>. Map output types may now be specified. These are also
- used as reduce input types, thus permitting reduce input types to
- differ from reduce output types.<br />(Runping Qi via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-216">HADOOP-216</a>. Add task progress to task status page.<br />(Bryan Pendleton via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-233">HADOOP-233</a>. Add web server to task tracker that shows running
- tasks and logs. Also add log access to job tracker web interface.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-205">HADOOP-205</a>. Incorporate pending tasks into tasktracker load
- calculations.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-247">HADOOP-247</a>. Fix sort progress to better handle exceptions.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-195">HADOOP-195</a>. Improve performance of the transfer of map outputs to
- reduce nodes by performing multiple transfers in parallel, each on
- a separate socket.<br />(Sameer Paranjpye via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-251">HADOOP-251</a>. Fix task processes to be tolerant of failed progress
- reports to their parent process.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-325">HADOOP-325</a>. Improve the FileNotFound exceptions thrown by
- LocalFileSystem to include the name of the file.<br />(Benjamin Reed via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-254">HADOOP-254</a>. Use HTTP to transfer map output data to reduce
- nodes. This, together with <a href="http://issues.apache.org/jira/browse/HADOOP-195">HADOOP-195</a>, greatly improves the
- performance of these transfers.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-163">HADOOP-163</a>. Cause datanodes that are unable to either read or
- write data to exit, so that the namenode will no longer target
- them for new blocks and will replicate their data on other nodes.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-222">HADOOP-222</a>. Add a -setrep option to the dfs commands that alters
- file replication levels.<br />(Johan Oskarson via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-75">HADOOP-75</a>. In DFS, only check for a complete file when the file
- is closed, rather than as each block is written.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-124">HADOOP-124</a>. Change DFS so that datanodes are identified by a
- persistent ID rather than by host and port. This solves a number
- of filesystem integrity problems, when, e.g., datanodes are
- restarted.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-256">HADOOP-256</a>. Add a C API for DFS.<br />(Arun C Murthy via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-211">HADOOP-211</a>. Switch to use the Jakarta Commons logging internally,
- configured to use log4j by default.<br />(Arun C Murthy and cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-265">HADOOP-265</a>. Tasktracker now fails to start if it does not have a
- writable local directory for temporary files. In this case, it
- logs a message to the JobTracker and exits.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-270">HADOOP-270</a>. Fix potential deadlock in datanode shutdown.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.2.1_-_2006-05-12_')">Release 0.2.1 - 2006-05-12
- </a></h3>
- <ol id="release_0.2.1_-_2006-05-12_">
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-199">HADOOP-199</a>. Fix reduce progress (broken by <a href="http://issues.apache.org/jira/browse/HADOOP-182">HADOOP-182</a>).<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-201">HADOOP-201</a>. Fix 'bin/hadoop dfs -report'.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-207">HADOOP-207</a>. Fix JDK 1.4 incompatibility introduced by <a href="http://issues.apache.org/jira/browse/HADOOP-96">HADOOP-96</a>.
- System.getenv() does not work in JDK 1.4.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.2.0_-_2006-05-05_')">Release 0.2.0 - 2006-05-05
- </a></h3>
- <ol id="release_0.2.0_-_2006-05-05_">
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-126">HADOOP-126</a>. 'bin/hadoop dfs -cp' now correctly copies .crc
- files.<br />(Konstantin Shvachko via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-51">HADOOP-51</a>. Change DFS to support per-file replication counts.<br />(Konstantin Shvachko via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-131">HADOOP-131</a>. Add scripts to start/stop dfs and mapred daemons.
- Use these in start/stop-all scripts.<br />(Chris Mattmann via cutting)</li>
- <li>Stop using ssh options by default that are not yet in widely used
- versions of ssh. Folks can still enable their use by uncommenting
- a line in conf/hadoop-env.sh.<br />(cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-92">HADOOP-92</a>. Show information about all attempts to run each
- task in the web ui.<br />(Mahadev Konar via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-128">HADOOP-128</a>. Improved DFS error handling.<br />(Owen O'Malley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-129">HADOOP-129</a>. Replace uses of java.io.File with new class named
- Path. This fixes bugs where java.io.File methods were called
- directly when FileSystem methods were desired, and reduces the
- likelihood of such bugs in the future. It also makes the handling
- of pathnames more consistent between local and dfs FileSystems and
- between Windows and Unix. java.io.File-based methods are still
- available for back-compatibility, but are deprecated and will be
- removed once 0.2 is released.<br />(cutting)</li>
- <li>Change dfs.data.dir and mapred.local.dir to be comma-separated
- lists of directories, rather than space-separated. This fixes
- several bugs on Windows.<br />(cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-144">HADOOP-144</a>. Use mapred task id for dfs client id, to
- facilitate debugging.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-143">HADOOP-143</a>. Do not line-wrap stack-traces in web ui.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-118">HADOOP-118</a>. In DFS, improve clean up of abandoned file
- creations.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-138">HADOOP-138</a>. Stop multiple tasks in a single heartbeat, rather
- than one per heartbeat.<br />(Stefan via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-139">HADOOP-139</a>. Remove a potential deadlock in
- LocalFileSystem.lock().<br />(Igor Bolotin via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-134">HADOOP-134</a>. Don't hang jobs when the tasktracker is
- misconfigured to use an un-writable local directory.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-115">HADOOP-115</a>. Correct an error message.<br />(Stack via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-133">HADOOP-133</a>. Retry pings from child to parent, in case of
- (local) communication problems. Also log exit status, so that one
- can distinguish patricide from other deaths.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-142">HADOOP-142</a>. Avoid re-running a task on a host where it has
- previously failed.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-148">HADOOP-148</a>. Maintain a task failure count for each
- tasktracker and display it in the web ui.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-151">HADOOP-151</a>. Close a potential socket leak, where new IPC
- connection pools were created per configuration instance that RPCs
- use. Now a global RPC connection pool is used again, as
- originally intended.<br />(cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-69">HADOOP-69</a>. Don't throw a NullPointerException when getting
- hints for non-existing file split.<br />(Bryan Pendleton via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-157">HADOOP-157</a>. When a task that writes dfs files (e.g., a reduce
- task) failed and was retried, it would fail again and again,
- eventually failing the job. The problem was that dfs did not yet
- know that the failed task had abandoned the files, and would not
- yet let another task create files with the same names. Dfs now
- retries when creating a file long enough for locks on abandoned
- files to expire.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-150">HADOOP-150</a>. Improved task names that include job
- names.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-162">HADOOP-162</a>. Fix ConcurrentModificationException when
- releasing file locks.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-132">HADOOP-132</a>. Initial check-in of new Metrics API, including
- implementations for writing metric data to a file and for sending
- it to Ganglia.<br />(David Bowen via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-160">HADOOP-160</a>. Remove some unneeded synchronization around
- time-consuming operations in the TaskTracker.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-166">HADOOP-166</a>. RPCs failed when passed subclasses of a declared
- parameter type. This is fixed by changing ObjectWritable to store
- both the declared type and the instance type for Writables. Note
- that this incompatibly changes the format of ObjectWritable and
- will render unreadable any ObjectWritables stored in files.
- Nutch only uses ObjectWritable in intermediate files, so this
- should not be a problem for Nutch.<br />(Stefan &amp; cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-168">HADOOP-168</a>. MapReduce RPC protocol methods should all declare
- IOException, so that timeouts are handled appropriately.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-169">HADOOP-169</a>. Don't fail a reduce task if a call to the
- jobtracker to locate map outputs fails.<br />(omalley via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-170">HADOOP-170</a>. Permit FileSystem clients to examine and modify
- the replication count of individual files. Also fix a few
- replication-related bugs.<br />(Konstantin Shvachko via cutting)</li>
- <li>Permit specification of a higher replication level for job
- submission files (job.xml and job.jar). This helps with large
- clusters, since these files are read by every node.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-173">HADOOP-173</a>. Optimize allocation of tasks with local data.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-167">HADOOP-167</a>. Reduce number of Configurations and JobConf's
- created.<br />(omalley via cutting)</li>
- <li>NUTCH-256. Change FileSystem#createNewFile() to create a .crc
- file. The lack of a .crc file was causing warnings.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-174">HADOOP-174</a>. Change JobClient to not abort job until it has failed
- to contact the job tracker for five attempts, not just one as
- before.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-177">HADOOP-177</a>. Change MapReduce web interface to page through tasks.
- Previously, when jobs had more than a few thousand tasks they
- could crash web browsers.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-178">HADOOP-178</a>. In DFS, piggyback blockwork requests from datanodes
- on heartbeat responses from namenode. This reduces the volume of
- RPC traffic. Also move startup delay in blockwork from datanode
- to namenode. This fixes a problem where restarting the namenode
- triggered a lot of unneeded replication.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-183">HADOOP-183</a>. If the DFS namenode is restarted with different
- minimum and/or maximum replication counts, existing files'
- replication counts are now automatically adjusted to be within the
- newly configured bounds.<br />(Hairong Kuang via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-186">HADOOP-186</a>. Better error handling in TaskTracker's top-level
- loop. Also improve calculation of time to send next heartbeat.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-187">HADOOP-187</a>. Add two MapReduce examples/benchmarks. One creates
- files containing random data. The second sorts the output of the
- first.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-185">HADOOP-185</a>. Fix so that, when a task tracker times out making the
- RPC asking for a new task to run, the job tracker does not think
- that it is actually running the task returned.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-190">HADOOP-190</a>. If a child process hangs after it has reported
- completion, its output should not be lost.<br />(Stack via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-184">HADOOP-184</a>. Re-structure some test code to better support testing
- on a cluster.<br />(Mahadev Konar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-191">HADOOP-191</a>. Add streaming package, Hadoop's first contrib module.
- This permits folks to easily submit MapReduce jobs whose map and
- reduce functions are implemented by shell commands. Use
- 'bin/hadoop jar build/hadoop-streaming.jar' to get details.<br />(Michel Tourn via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-189">HADOOP-189</a>. Fix MapReduce in standalone configuration to
- correctly handle job jar files that contain a lib directory with
- nested jar files.<br />(cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-65">HADOOP-65</a>. Initial version of record I/O framework that enables
- the specification of record types and generates marshalling code
- in both Java and C++. Generated Java code implements
- WritableComparable, but is not yet otherwise used by
- Hadoop.<br />(Milind Bhandarkar via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-193">HADOOP-193</a>. Add a MapReduce-based FileSystem benchmark.<br />(Konstantin Shvachko via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-194">HADOOP-194</a>. Add a MapReduce-based FileSystem checker. This reads
- every block in every file in the filesystem.<br />(Konstantin Shvachko
- via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-182">HADOOP-182</a>. Fix so that lost task trackers do not change the
- status of reduce tasks or completed jobs. Also fixes the progress
- meter so that failed tasks are subtracted.<br />(omalley via cutting)</li>
- <li><a href="http://issues.apache.org/jira/browse/HADOOP-96">HADOOP-96</a>. Logging improvements. Log files are now separate from
- standard output and standard error files. Logs are now rolled.
- Logging of all DFS state changes can be enabled, to facilitate
- debugging.<br />(Hairong Kuang via cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.1.1_-_2006-04-08_')">Release 0.1.1 - 2006-04-08
- </a></h3>
- <ol id="release_0.1.1_-_2006-04-08_">
- <li>Added CHANGES.txt, logging all significant changes to Hadoop.<br />(cutting)</li>
- <li>Fix MapReduceBase.close() to throw IOException, as declared in the
- Closeable interface. This permits subclasses which override this
- method to throw that exception.<br />(cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-117">HADOOP-117</a>. Pathnames were mistakenly transposed in
- JobConf.getLocalFile() causing many mapred temporary files to not
- be removed.<br />(Raghavendra Prabhu via cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-116">HADOOP-116</a>. Clean up job submission files when jobs complete.<br />(cutting)</li>
- <li>Fix <a href="http://issues.apache.org/jira/browse/HADOOP-125">HADOOP-125</a>. Fix handling of absolute paths on Windows.<br />(cutting)</li>
- </ol>
- <h3><a href="javascript:toggleList('release_0.1.0_-_2006-04-01_')">Release 0.1.0 - 2006-04-01
- </a></h3>
- <ol id="release_0.1.0_-_2006-04-01_">
- <li>The first release of Hadoop.
- </li>
- </ol>
- </ul>
- </body>
- </html>
|