
MAPREDUCE-2365. Add counters to track bytes (read,written) via File(Input,Output)Format. Contributed by Siddharth Seth.

git-svn-id: https://svn.apache.org/repos/asf/hadoop/common/trunk@1146515 13f79535-47bb-0310-9956-ffa450edef68
Arun Murthy 14 years ago
Commit
4796e1adcb
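This change adds FileInputFormatCounter.BYTES_READ, FileOutputFormatCounter.BYTES_WRITTEN and TaskCounter.MAP_OUTPUT_MATERIALIZED_BYTES, all fed from FileSystem.Statistics deltas taken around each read/write. As a rough illustration only (not part of the commit; the class name and driver setup below are assumptions), a client could read the new counters from a completed job like this:

import org.apache.hadoop.mapreduce.Counters;
import org.apache.hadoop.mapreduce.Job;
import org.apache.hadoop.mapreduce.TaskCounter;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;
import org.apache.hadoop.mapreduce.lib.output.FileOutputFormatCounter;

class FileCounterReport {
  // Prints the file-format byte counters of a job that has already finished.
  static void report(Job completedJob) throws Exception {
    Counters counters = completedJob.getCounters();
    long bytesRead =
        counters.findCounter(FileInputFormatCounter.BYTES_READ).getValue();
    long bytesWritten =
        counters.findCounter(FileOutputFormatCounter.BYTES_WRITTEN).getValue();
    long materialized =
        counters.findCounter(TaskCounter.MAP_OUTPUT_MATERIALIZED_BYTES).getValue();
    System.out.println("FileInputFormat bytes read:     " + bytesRead);
    System.out.println("FileOutputFormat bytes written: " + bytesWritten);
    System.out.println("Map output materialized bytes:  " + materialized);
  }
}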

+ 3 - 0
mapreduce/CHANGES.txt

@@ -40,6 +40,9 @@ Trunk (unreleased changes)
 
   IMPROVEMENTS
 
+    MAPREDUCE-2365. Add counters to track bytes (read,written) via 
+    File(Input,Output)Format. (Siddharth Seth via acmurthy)
+ 
     MAPREDUCE-2680. Display queue name in job client CLI. (acmurthy) 
 
     MAPREDUCE-2679. Minor changes to sync trunk with MR-279 branch. (acmurthy) 

+ 2 - 3
mapreduce/src/java/org/apache/hadoop/mapred/Counters.java

@@ -38,7 +38,7 @@ import org.apache.hadoop.io.IntWritable;
 import org.apache.hadoop.io.Text;
 import org.apache.hadoop.io.Writable;
 import org.apache.hadoop.io.WritableUtils;
-import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
+import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;
 import org.apache.hadoop.util.StringUtils;
 
 /**
@@ -457,11 +457,10 @@ public class Counters implements Writable, Iterable<Counters.Group> {
    */
   public synchronized Counter findCounter(String group, String name) {
     if (name.equals("MAP_INPUT_BYTES")) {
-      group = FileInputFormat.COUNTER_GROUP; 
-      name = FileInputFormat.BYTES_READ; 
       LOG.warn("Counter name MAP_INPUT_BYTES is deprecated. " +
                "Use FileInputFormatCounters as group name and " +
                " BYTES_READ as counter name instead");
+      return findCounter(FileInputFormatCounter.BYTES_READ);
     }
     return getGroup(group).getCounterForName(name);
   }
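For illustration only (the CounterLookupSketch class below is an assumption, not part of the patch), the deprecated string lookup and the new enum lookup should now resolve to the same counter:

import org.apache.hadoop.mapred.Counters;
import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;

class CounterLookupSketch {
  // findCounter(String, String) remaps the deprecated MAP_INPUT_BYTES name
  // (after logging a warning) to FileInputFormatCounter.BYTES_READ.
  static boolean sameCounter(Counters counters) {
    Counters.Counter viaDeprecatedName =
        counters.findCounter("FileInputFormatCounters", "MAP_INPUT_BYTES");
    Counters.Counter viaEnum =
        counters.findCounter(FileInputFormatCounter.BYTES_READ);
    return viaDeprecatedName == viaEnum;
  }
}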

+ 138 - 32
mapreduce/src/java/org/apache/hadoop/mapred/MapTask.java

@@ -35,7 +35,7 @@ import org.apache.commons.logging.LogFactory;
 import org.apache.hadoop.fs.FSDataInputStream;
 import org.apache.hadoop.fs.FSDataOutputStream;
 import org.apache.hadoop.fs.FileSystem;
-import org.apache.hadoop.fs.LocalDirAllocator;
+import org.apache.hadoop.fs.FileSystem.Statistics;
 import org.apache.hadoop.fs.LocalFileSystem;
 import org.apache.hadoop.fs.Path;
 import org.apache.hadoop.io.DataInputBuffer;
@@ -51,12 +51,12 @@ import org.apache.hadoop.io.serializer.Serializer;
 import org.apache.hadoop.mapred.IFile.Writer;
 import org.apache.hadoop.mapred.Merger.Segment;
 import org.apache.hadoop.mapred.SortedRanges.SkipRangeIterator;
-import org.apache.hadoop.mapreduce.MRConfig;
 import org.apache.hadoop.mapreduce.MRJobConfig;
 import org.apache.hadoop.mapreduce.TaskAttemptContext;
 import org.apache.hadoop.mapreduce.TaskCounter;
-import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
+import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;
 import org.apache.hadoop.mapreduce.lib.map.WrappedMapper;
+import org.apache.hadoop.mapreduce.lib.output.FileOutputFormatCounter;
 import org.apache.hadoop.mapreduce.split.JobSplit.TaskSplitIndex;
 import org.apache.hadoop.mapreduce.task.MapContextImpl;
 import org.apache.hadoop.util.IndexedSortable;
@@ -141,20 +141,31 @@ class MapTask extends Task {
   class TrackedRecordReader<K, V> 
       implements RecordReader<K,V> {
     private RecordReader<K,V> rawIn;
-    private Counters.Counter inputByteCounter;
+    private Counters.Counter fileInputByteCounter;
     private Counters.Counter inputRecordCounter;
     private TaskReporter reporter;
-    private long beforePos = -1;
-    private long afterPos = -1;
+    private long bytesInPrev = -1;
+    private long bytesInCurr = -1;
+    private final Statistics fsStats;
     
-    TrackedRecordReader(RecordReader<K,V> raw, TaskReporter reporter) 
+    TrackedRecordReader(TaskReporter reporter, JobConf job) 
       throws IOException{
-      rawIn = raw;
       inputRecordCounter = reporter.getCounter(TaskCounter.MAP_INPUT_RECORDS);
-      inputByteCounter = reporter.getCounter(
-                           FileInputFormat.COUNTER_GROUP,
-                           FileInputFormat.BYTES_READ);
+      fileInputByteCounter = reporter.getCounter(FileInputFormatCounter.BYTES_READ);
       this.reporter = reporter;
+      
+      Statistics matchedStats = null;
+      if (this.reporter.getInputSplit() instanceof FileSplit) {
+        matchedStats = getFsStatistics(((FileSplit) this.reporter
+            .getInputSplit()).getPath(), job);
+      }
+      fsStats = matchedStats;
+
+      bytesInPrev = getInputBytes(fsStats);
+      rawIn = job.getInputFormat().getRecordReader(reporter.getInputSplit(),
+          job, reporter);
+      bytesInCurr = getInputBytes(fsStats);
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
     }
 
     public K createKey() {
@@ -176,26 +187,37 @@ class MapTask extends Task {
     
     protected void incrCounters() {
       inputRecordCounter.increment(1);
-      inputByteCounter.increment(afterPos - beforePos);
     }
      
     protected synchronized boolean moveToNext(K key, V value)
       throws IOException {
-      beforePos = getPos();
+      bytesInPrev = getInputBytes(fsStats);
       boolean ret = rawIn.next(key, value);
-      afterPos = getPos();
+      bytesInCurr = getInputBytes(fsStats);
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
       reporter.setProgress(getProgress());
       return ret;
     }
     
     public long getPos() throws IOException { return rawIn.getPos(); }
-    public void close() throws IOException { rawIn.close(); }
+
+    public void close() throws IOException {
+      bytesInPrev = getInputBytes(fsStats);
+      rawIn.close();
+      bytesInCurr = getInputBytes(fsStats);
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
+    }
+
     public float getProgress() throws IOException {
       return rawIn.getProgress();
     }
     TaskReporter getTaskReporter() {
       return reporter;
     }
+
+    private long getInputBytes(Statistics stats) {
+      return stats == null ? 0 : stats.getBytesRead();
+    }
   }
 
   /**
@@ -210,9 +232,9 @@ class MapTask extends Task {
     private Counters.Counter skipRecCounter;
     private long recIndex = -1;
     
-    SkippingRecordReader(RecordReader<K,V> raw, TaskUmbilicalProtocol umbilical,
-                         TaskReporter reporter) throws IOException{
-      super(raw, reporter);
+    SkippingRecordReader(TaskUmbilicalProtocol umbilical,
+                         TaskReporter reporter, JobConf job) throws IOException{
+      super(reporter, job);
       this.umbilical = umbilical;
       this.skipRecCounter = reporter.getCounter(TaskCounter.MAP_SKIPPED_RECORDS);
       this.toWriteSkipRecs = toWriteSkipRecs() &&  
@@ -356,11 +378,9 @@ class MapTask extends Task {
     updateJobWithSplit(job, inputSplit);
     reporter.setInputSplit(inputSplit);
 
-    RecordReader<INKEY,INVALUE> rawIn =                  // open input
-      job.getInputFormat().getRecordReader(inputSplit, job, reporter);
     RecordReader<INKEY,INVALUE> in = isSkipping() ? 
-        new SkippingRecordReader<INKEY,INVALUE>(rawIn, umbilical, reporter) :
-        new TrackedRecordReader<INKEY,INVALUE>(rawIn, reporter);
+        new SkippingRecordReader<INKEY,INVALUE>(umbilical, reporter, job) :
+          new TrackedRecordReader<INKEY,INVALUE>(reporter, job);
     job.setBoolean(JobContext.SKIP_RECORDS, isSkipping());
 
 
@@ -409,18 +429,40 @@ class MapTask extends Task {
     extends org.apache.hadoop.mapreduce.RecordReader<K,V> {
     private final org.apache.hadoop.mapreduce.RecordReader<K,V> real;
     private final org.apache.hadoop.mapreduce.Counter inputRecordCounter;
+    private final org.apache.hadoop.mapreduce.Counter fileInputByteCounter;
     private final TaskReporter reporter;
+    private final Statistics fsStats;
     
-    NewTrackingRecordReader(org.apache.hadoop.mapreduce.RecordReader<K,V> real,
-                            TaskReporter reporter) {
-      this.real = real;
+    NewTrackingRecordReader(org.apache.hadoop.mapreduce.InputSplit split,
+        org.apache.hadoop.mapreduce.InputFormat<K, V> inputFormat,
+        TaskReporter reporter,
+        org.apache.hadoop.mapreduce.TaskAttemptContext taskContext)
+        throws InterruptedException, IOException {
       this.reporter = reporter;
-      this.inputRecordCounter = reporter.getCounter(TaskCounter.MAP_INPUT_RECORDS);
+      this.inputRecordCounter = reporter
+          .getCounter(TaskCounter.MAP_INPUT_RECORDS);
+      this.fileInputByteCounter = reporter
+          .getCounter(FileInputFormatCounter.BYTES_READ);
+
+      Statistics matchedStats = null;
+      if (split instanceof org.apache.hadoop.mapreduce.lib.input.FileSplit) {
+        matchedStats = getFsStatistics(((org.apache.hadoop.mapreduce.lib.input.FileSplit) split)
+            .getPath(), taskContext.getConfiguration());
+      }
+      fsStats = matchedStats;
+
+      long bytesInPrev = getInputBytes(fsStats);
+      this.real = inputFormat.createRecordReader(split, taskContext);
+      long bytesInCurr = getInputBytes(fsStats);
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
     }
 
     @Override
     public void close() throws IOException {
+      long bytesInPrev = getInputBytes(fsStats);
       real.close();
+      long bytesInCurr = getInputBytes(fsStats);
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
     }
 
     @Override
@@ -442,18 +484,28 @@ class MapTask extends Task {
     public void initialize(org.apache.hadoop.mapreduce.InputSplit split,
                            org.apache.hadoop.mapreduce.TaskAttemptContext context
                            ) throws IOException, InterruptedException {
+      long bytesInPrev = getInputBytes(fsStats);
       real.initialize(split, context);
+      long bytesInCurr = getInputBytes(fsStats);
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
     }
 
     @Override
     public boolean nextKeyValue() throws IOException, InterruptedException {
+      long bytesInPrev = getInputBytes(fsStats);
       boolean result = real.nextKeyValue();
+      long bytesInCurr = getInputBytes(fsStats);
       if (result) {
         inputRecordCounter.increment(1);
       }
+      fileInputByteCounter.increment(bytesInCurr - bytesInPrev);
       reporter.setProgress(getProgress());
       return result;
     }
+
+    private long getInputBytes(Statistics stats) {
+      return stats == null ? 0 : stats.getBytesRead();
+    }
   }
 
   /**
@@ -506,15 +558,30 @@ class MapTask extends Task {
     private final TaskReporter reporter;
 
     private final Counters.Counter mapOutputRecordCounter;
+    private final Counters.Counter fileOutputByteCounter; 
+    private final Statistics fsStats;
     
     @SuppressWarnings("unchecked")
     NewDirectOutputCollector(MRJobConfig jobContext,
         JobConf job, TaskUmbilicalProtocol umbilical, TaskReporter reporter) 
     throws IOException, ClassNotFoundException, InterruptedException {
       this.reporter = reporter;
+      mapOutputRecordCounter = reporter
+          .getCounter(TaskCounter.MAP_OUTPUT_RECORDS);
+      fileOutputByteCounter = reporter
+          .getCounter(FileOutputFormatCounter.BYTES_WRITTEN);
+
+      Statistics matchedStats = null;
+      if (outputFormat instanceof org.apache.hadoop.mapreduce.lib.output.FileOutputFormat) {
+        matchedStats = getFsStatistics(org.apache.hadoop.mapreduce.lib.output.FileOutputFormat
+            .getOutputPath(taskContext), taskContext.getConfiguration());
+      }
+      fsStats = matchedStats;
+
+      long bytesOutPrev = getOutputBytes(fsStats);
       out = outputFormat.getRecordWriter(taskContext);
-      mapOutputRecordCounter = 
-        reporter.getCounter(TaskCounter.MAP_OUTPUT_RECORDS);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
     }
 
     @Override
@@ -522,7 +589,10 @@ class MapTask extends Task {
     public void write(K key, V value) 
     throws IOException, InterruptedException {
       reporter.progress();
+      long bytesOutPrev = getOutputBytes(fsStats);
       out.write(key, value);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
       mapOutputRecordCounter.increment(1);
     }
 
@@ -531,9 +601,16 @@ class MapTask extends Task {
     throws IOException,InterruptedException {
       reporter.progress();
       if (out != null) {
+        long bytesOutPrev = getOutputBytes(fsStats);
         out.close(context);
+        long bytesOutCurr = getOutputBytes(fsStats);
+        fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
       }
     }
+    
+    private long getOutputBytes(Statistics stats) {
+      return stats == null ? 0 : stats.getBytesWritten();
+    }
   }
   
   private class NewOutputCollector<K,V>
@@ -609,7 +686,7 @@ class MapTask extends Task {
 
     org.apache.hadoop.mapreduce.RecordReader<INKEY,INVALUE> input =
       new NewTrackingRecordReader<INKEY,INVALUE>
-          (inputFormat.createRecordReader(split, taskContext), reporter);
+        (split, inputFormat, reporter, taskContext);
     
     job.setBoolean(JobContext.SKIP_RECORDS, isSkipping());
     org.apache.hadoop.mapreduce.RecordWriter output = null;
@@ -662,6 +739,8 @@ class MapTask extends Task {
     private TaskReporter reporter = null;
 
     private final Counters.Counter mapOutputRecordCounter;
+    private final Counters.Counter fileOutputByteCounter;
+    private final Statistics fsStats;
 
     @SuppressWarnings("unchecked")
     public DirectMapOutputCollector(TaskUmbilicalProtocol umbilical,
@@ -670,14 +749,30 @@ class MapTask extends Task {
       String finalName = getOutputName(getPartition());
       FileSystem fs = FileSystem.get(job);
 
-      out = job.getOutputFormat().getRecordWriter(fs, job, finalName, reporter);
-
+      OutputFormat<K, V> outputFormat = job.getOutputFormat();   
       mapOutputRecordCounter = reporter.getCounter(TaskCounter.MAP_OUTPUT_RECORDS);
+      
+      fileOutputByteCounter = reporter
+          .getCounter(FileOutputFormatCounter.BYTES_WRITTEN);
+
+      Statistics matchedStats = null;
+      if (outputFormat instanceof FileOutputFormat) {
+        matchedStats = getFsStatistics(FileOutputFormat.getOutputPath(job), job);
+      }
+      fsStats = matchedStats;
+
+      long bytesOutPrev = getOutputBytes(fsStats);
+      out = job.getOutputFormat().getRecordWriter(fs, job, finalName, reporter);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
     }
 
     public void close() throws IOException {
       if (this.out != null) {
+        long bytesOutPrev = getOutputBytes(fsStats);
         out.close(this.reporter);
+        long bytesOutCurr = getOutputBytes(fsStats);
+        fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
       }
 
     }
@@ -688,10 +783,16 @@ class MapTask extends Task {
 
     public void collect(K key, V value, int partition) throws IOException {
       reporter.progress();
+      long bytesOutPrev = getOutputBytes(fsStats);
       out.write(key, value);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
       mapOutputRecordCounter.increment(1);
     }
-    
+
+    private long getOutputBytes(Statistics stats) {
+      return stats == null ? 0 : stats.getBytesWritten();
+    }
   }
 
   private class MapOutputBuffer<K extends Object, V extends Object>
@@ -757,6 +858,7 @@ class MapTask extends Task {
     // Counters
     final Counters.Counter mapOutputByteCounter;
     final Counters.Counter mapOutputRecordCounter;
+    final Counters.Counter fileOutputByteCounter;
 
     final ArrayList<SpillRecord> indexCacheList =
       new ArrayList<SpillRecord>();
@@ -823,6 +925,8 @@ class MapTask extends Task {
       mapOutputByteCounter = reporter.getCounter(TaskCounter.MAP_OUTPUT_BYTES);
       mapOutputRecordCounter =
         reporter.getCounter(TaskCounter.MAP_OUTPUT_RECORDS);
+      fileOutputByteCounter = reporter
+          .getCounter(TaskCounter.MAP_OUTPUT_MATERIALIZED_BYTES);
 
       // compression
       if (job.getCompressMapOutput()) {
@@ -1317,6 +1421,8 @@ class MapTask extends Task {
       // release sort buffer before the merge
       kvbuffer = null;
       mergeParts();
+      Path outputPath = mapOutputFile.getOutputFile();
+      fileOutputByteCounter.increment(rfs.getFileStatus(outputPath).getLen());
     }
 
     public void close() { }

+ 89 - 15
mapreduce/src/java/org/apache/hadoop/mapred/ReduceTask.java

@@ -34,6 +34,7 @@ import org.apache.hadoop.classification.InterfaceStability;
 import org.apache.hadoop.conf.Configuration;
 import org.apache.hadoop.fs.FileStatus;
 import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.FileSystem.Statistics;
 import org.apache.hadoop.fs.Path;
 import org.apache.hadoop.io.DataInputBuffer;
 import org.apache.hadoop.io.RawComparator;
@@ -48,6 +49,7 @@ import org.apache.hadoop.mapred.SortedRanges.SkipRangeIterator;
 import org.apache.hadoop.mapred.TaskTracker.TaskInProgress;
 import org.apache.hadoop.mapreduce.TaskAttemptContext;
 import org.apache.hadoop.mapreduce.TaskCounter;
+import org.apache.hadoop.mapreduce.lib.output.FileOutputFormatCounter;
 import org.apache.hadoop.mapreduce.server.jobtracker.JTConfig;
 import org.apache.hadoop.mapreduce.task.reduce.Shuffle;
 import org.apache.hadoop.util.Progress;
@@ -95,6 +97,8 @@ public class ReduceTask extends Task {
     getCounters().findCounter(TaskCounter.COMBINE_INPUT_RECORDS);
   private Counters.Counter reduceCombineOutputCounter =
     getCounters().findCounter(TaskCounter.COMBINE_OUTPUT_RECORDS);
+  private Counters.Counter fileOutputByteCounter =
+    getCounters().findCounter(FileOutputFormatCounter.BYTES_WRITTEN);
 
   // A custom comparator for map output files. Here the ordering is determined
   // by the file's size and path. In case of files with same size and different
@@ -407,17 +411,14 @@ public class ReduceTask extends Task {
     // make output collector
     String finalName = getOutputName(getPartition());
 
-    FileSystem fs = FileSystem.get(job);
+    final RecordWriter<OUTKEY, OUTVALUE> out = new OldTrackingRecordWriter<OUTKEY, OUTVALUE>(
+        this, job, reporter, finalName);
 
-    final RecordWriter<OUTKEY,OUTVALUE> out = 
-      job.getOutputFormat().getRecordWriter(fs, job, finalName, reporter);  
-    
     OutputCollector<OUTKEY,OUTVALUE> collector = 
       new OutputCollector<OUTKEY,OUTVALUE>() {
         public void collect(OUTKEY key, OUTVALUE value)
           throws IOException {
           out.write(key, value);
-          reduceOutputCounter.increment(1);
           // indicate that progress update needs to be sent
           reporter.progress();
         }
@@ -465,28 +466,104 @@ public class ReduceTask extends Task {
     }
   }
 
+  static class OldTrackingRecordWriter<K, V> implements RecordWriter<K, V> {
+
+    private final RecordWriter<K, V> real;
+    private final org.apache.hadoop.mapred.Counters.Counter reduceOutputCounter;
+    private final org.apache.hadoop.mapred.Counters.Counter fileOutputByteCounter;
+    private final Statistics fsStats;
+
+    @SuppressWarnings({ "deprecation", "unchecked" })
+    public OldTrackingRecordWriter(ReduceTask reduce, JobConf job,
+        TaskReporter reporter, String finalName) throws IOException {
+      this.reduceOutputCounter = reduce.reduceOutputCounter;
+      this.fileOutputByteCounter = reduce.fileOutputByteCounter;
+      Statistics matchedStats = null;
+      if (job.getOutputFormat() instanceof FileOutputFormat) {
+        matchedStats = getFsStatistics(FileOutputFormat.getOutputPath(job), job);
+      }
+      fsStats = matchedStats;
+
+      FileSystem fs = FileSystem.get(job);
+      long bytesOutPrev = getOutputBytes(fsStats);
+      this.real = job.getOutputFormat().getRecordWriter(fs, job, finalName,
+          reporter);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
+    }
+
+    @Override
+    public void write(K key, V value) throws IOException {
+      long bytesOutPrev = getOutputBytes(fsStats);
+      real.write(key, value);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
+      reduceOutputCounter.increment(1);
+    }
+
+    @Override
+    public void close(Reporter reporter) throws IOException {
+      long bytesOutPrev = getOutputBytes(fsStats);
+      real.close(reporter);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
+    }
+
+    private long getOutputBytes(Statistics stats) {
+      return stats == null ? 0 : stats.getBytesWritten();
+    }
+  }
+
   static class NewTrackingRecordWriter<K,V> 
       extends org.apache.hadoop.mapreduce.RecordWriter<K,V> {
     private final org.apache.hadoop.mapreduce.RecordWriter<K,V> real;
     private final org.apache.hadoop.mapreduce.Counter outputRecordCounter;
-  
-    NewTrackingRecordWriter(org.apache.hadoop.mapreduce.RecordWriter<K,V> real,
-                            org.apache.hadoop.mapreduce.Counter recordCounter) {
-      this.real = real;
-      this.outputRecordCounter = recordCounter;
+    private final org.apache.hadoop.mapreduce.Counter fileOutputByteCounter;
+    private final Statistics fsStats;
+
+    @SuppressWarnings("unchecked")
+    NewTrackingRecordWriter(ReduceTask reduce,
+        org.apache.hadoop.mapreduce.TaskAttemptContext taskContext)
+        throws InterruptedException, IOException {
+      this.outputRecordCounter = reduce.reduceOutputCounter;
+      this.fileOutputByteCounter = reduce.fileOutputByteCounter;
+
+      Statistics matchedStats = null;
+      if (reduce.outputFormat instanceof org.apache.hadoop.mapreduce.lib.output.FileOutputFormat) {
+        matchedStats = getFsStatistics(org.apache.hadoop.mapreduce.lib.output.FileOutputFormat
+            .getOutputPath(taskContext), taskContext.getConfiguration());
+      }
+
+      fsStats = matchedStats;
+
+      long bytesOutPrev = getOutputBytes(fsStats);
+      this.real = (org.apache.hadoop.mapreduce.RecordWriter<K, V>) reduce.outputFormat
+          .getRecordWriter(taskContext);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
     }
 
     @Override
     public void close(TaskAttemptContext context) throws IOException,
     InterruptedException {
+      long bytesOutPrev = getOutputBytes(fsStats);
       real.close(context);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
     }
 
     @Override
     public void write(K key, V value) throws IOException, InterruptedException {
+      long bytesOutPrev = getOutputBytes(fsStats);
       real.write(key,value);
+      long bytesOutCurr = getOutputBytes(fsStats);
+      fileOutputByteCounter.increment(bytesOutCurr - bytesOutPrev);
       outputRecordCounter.increment(1);
     }
+
+    private long getOutputBytes(Statistics stats) {
+      return stats == null ? 0 : stats.getBytesWritten();
+    }
   }
 
   @SuppressWarnings("unchecked")
@@ -529,11 +606,8 @@ public class ReduceTask extends Task {
     org.apache.hadoop.mapreduce.Reducer<INKEY,INVALUE,OUTKEY,OUTVALUE> reducer =
       (org.apache.hadoop.mapreduce.Reducer<INKEY,INVALUE,OUTKEY,OUTVALUE>)
         ReflectionUtils.newInstance(taskContext.getReducerClass(), job);
-    org.apache.hadoop.mapreduce.RecordWriter<OUTKEY,OUTVALUE> output =
-      (org.apache.hadoop.mapreduce.RecordWriter<OUTKEY,OUTVALUE>)
-        outputFormat.getRecordWriter(taskContext);
     org.apache.hadoop.mapreduce.RecordWriter<OUTKEY,OUTVALUE> trackedRW = 
-      new NewTrackingRecordWriter<OUTKEY, OUTVALUE>(output, reduceOutputCounter);
+      new NewTrackingRecordWriter<OUTKEY, OUTVALUE>(this, taskContext);
     job.setBoolean("mapred.skip.on", isSkipping());
     job.setBoolean(JobContext.SKIP_RECORDS, isSkipping());
     org.apache.hadoop.mapreduce.Reducer.Context 
@@ -545,6 +619,6 @@ public class ReduceTask extends Task {
                                                reporter, comparator, keyClass,
                                                valueClass);
     reducer.run(reducerContext);
-    output.close(reducerContext);
+    trackedRW.close(reducerContext);
   }
 }

+ 22 - 0
mapreduce/src/java/org/apache/hadoop/mapred/Task.java

@@ -289,6 +289,28 @@ abstract public class Task implements Writable, Configurable {
     }
   }
 
+  /**
+   * Gets a handle to the Statistics instance based on the scheme associated
+   * with path.
+   * 
+   * @param path the path.
+   * @param conf the configuration to extract the scheme from if not part of 
+   *   the path.
+   * @return a Statistics instance, or null if none is found for the scheme.
+   */
+  protected static Statistics getFsStatistics(Path path, Configuration conf) throws IOException {
+    Statistics matchedStats = null;
+    path = path.getFileSystem(conf).makeQualified(path);
+    String scheme = path.toUri().getScheme();
+    for (Statistics stats : FileSystem.getAllStatistics()) {
+      if (stats.getScheme().equals(scheme)) {
+        matchedStats = stats;
+        break;
+      }
+    }
+    return matchedStats;
+  }
+
   /**
    * Get skipRanges.
    */
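The getFsStatistics helper added above is what MapTask and ReduceTask use to turn raw FileSystem.Statistics into counter updates: they snapshot the byte count before and after each I/O call and add the difference. A minimal, self-contained sketch of that delta pattern (illustrative only, not part of the patch; it re-inlines the scheme-matching loop because getFsStatistics is protected to Task):

import java.io.IOException;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.FileSystem.Statistics;
import org.apache.hadoop.fs.Path;

class FsStatisticsDeltaSketch {
  // Returns how many bytes the write added to the Statistics entry for the
  // path's scheme (0 if no matching Statistics entry exists).
  static long writeAndMeasure(Path path, Configuration conf, byte[] data)
      throws IOException {
    FileSystem fs = path.getFileSystem(conf);
    String scheme = fs.makeQualified(path).toUri().getScheme();
    Statistics stats = null;
    for (Statistics s : FileSystem.getAllStatistics()) {
      if (s.getScheme().equals(scheme)) {
        stats = s;
        break;
      }
    }
    long before = stats == null ? 0 : stats.getBytesWritten();
    FSDataOutputStream out = fs.create(path);
    try {
      out.write(data);
    } finally {
      out.close();
    }
    long after = stats == null ? 0 : stats.getBytesWritten();
    return after - before;   // this delta is what feeds BYTES_WRITTEN
  }
}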

+ 1 - 0
mapreduce/src/java/org/apache/hadoop/mapreduce/TaskCounter.java

@@ -29,6 +29,7 @@ public enum TaskCounter {
   MAP_OUTPUT_RECORDS,
   MAP_OUTPUT_RECORDS,
   MAP_SKIPPED_RECORDS,
   MAP_OUTPUT_BYTES,
+  MAP_OUTPUT_MATERIALIZED_BYTES,
   SPLIT_RAW_BYTES,
   COMBINE_INPUT_RECORDS,
   COMBINE_OUTPUT_RECORDS,
+ 1 - 0
mapreduce/src/java/org/apache/hadoop/mapreduce/TaskCounter.properties

@@ -17,6 +17,7 @@ CounterGroupName=              Map-Reduce Framework
 MAP_INPUT_RECORDS.name=        Map input records
 MAP_OUTPUT_RECORDS.name=       Map output records
 MAP_OUTPUT_BYTES.name=         Map output bytes
+MAP_OUTPUT_MATERIALIZED_BYTES.name= Map output materialized bytes
 MAP_SKIPPED_RECORDS.name=      Map skipped records
 COMBINE_INPUT_RECORDS.name=    Combine input records
 COMBINE_OUTPUT_RECORDS.name=   Combine output records

+ 0 - 3
mapreduce/src/java/org/apache/hadoop/mapreduce/lib/input/FileInputFormat.java

@@ -54,9 +54,6 @@ import org.apache.hadoop.util.StringUtils;
 @InterfaceAudience.Public
 @InterfaceStability.Stable
 public abstract class FileInputFormat<K, V> extends InputFormat<K, V> {
-  public static final String COUNTER_GROUP = 
-                                "FileInputFormatCounters";
-  public static final String BYTES_READ = "BYTES_READ";
   public static final String INPUT_DIR = 
     "mapreduce.input.fileinputformat.inputdir";
   public static final String SPLIT_MAXSIZE = 

+ 0 - 5
mapreduce/src/java/org/apache/hadoop/mapreduce/lib/input/LineRecordReader.java

@@ -35,7 +35,6 @@ import org.apache.hadoop.io.compress.SplitCompressionInputStream;
 import org.apache.hadoop.io.compress.SplittableCompressionCodec;
 import org.apache.hadoop.io.compress.CompressionCodecFactory;
 import org.apache.hadoop.io.compress.Decompressor;
-import org.apache.hadoop.mapreduce.Counter;
 import org.apache.hadoop.mapreduce.InputSplit;
 import org.apache.hadoop.mapreduce.RecordReader;
 import org.apache.hadoop.mapreduce.TaskAttemptContext;
@@ -63,7 +62,6 @@ public class LineRecordReader extends RecordReader<LongWritable, Text> {
   private int maxLineLength;
   private LongWritable key = null;
   private Text value = null;
-  private Counter inputByteCounter;
   private CompressionCodec codec;
   private Decompressor decompressor;
   private byte[] recordDelimiterBytes;
@@ -78,8 +76,6 @@ public class LineRecordReader extends RecordReader<LongWritable, Text> {
   public void initialize(InputSplit genericSplit,
                          TaskAttemptContext context) throws IOException {
     FileSplit split = (FileSplit) genericSplit;
-    inputByteCounter = context.getCounter(
-      FileInputFormat.COUNTER_GROUP, FileInputFormat.BYTES_READ);
     Configuration job = context.getConfiguration();
     this.maxLineLength = job.getInt(MAX_LINE_LENGTH, Integer.MAX_VALUE);
     start = split.getStart();
@@ -174,7 +170,6 @@ public class LineRecordReader extends RecordReader<LongWritable, Text> {
         break;
       }
       pos += newSize;
-      inputByteCounter.increment(newSize);
       if (newSize < maxLineLength) {
         break;
       }

+ 2 - 9
mapreduce/src/java/org/apache/hadoop/mapreduce/lib/input/SequenceFileRecordReader.java

@@ -27,9 +27,7 @@ import org.apache.hadoop.conf.Configuration;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
 import org.apache.hadoop.io.*;
-import org.apache.hadoop.mapreduce.Counter;
 import org.apache.hadoop.mapreduce.InputSplit;
-import org.apache.hadoop.mapreduce.MapContext;
 import org.apache.hadoop.mapreduce.RecordReader;
 import org.apache.hadoop.mapreduce.TaskAttemptContext;
 
@@ -44,16 +42,12 @@ public class SequenceFileRecordReader<K, V> extends RecordReader<K, V> {
   private K key = null;
   private V value = null;
   protected Configuration conf;
-  private Counter inputByteCounter;
-  private long pos;
-  
+
   @Override
   public void initialize(InputSplit split, 
                          TaskAttemptContext context
                          ) throws IOException, InterruptedException {
     FileSplit fileSplit = (FileSplit) split;
-    inputByteCounter = ((MapContext)context).getCounter(
-      FileInputFormat.COUNTER_GROUP, FileInputFormat.BYTES_READ);
     conf = context.getConfiguration();    
     Path path = fileSplit.getPath();
     FileSystem fs = path.getFileSystem(conf);
@@ -74,8 +68,7 @@ public class SequenceFileRecordReader<K, V> extends RecordReader<K, V> {
     if (!more) {
       return false;
     }
-    inputByteCounter.increment(in.getPosition()-pos);
-    pos = in.getPosition();
+    long pos = in.getPosition();
     key = (K) in.next(key);
     if (key == null || (pos >= end && in.syncSeen())) {
       more = false;

+ 3 - 1
mapreduce/src/java/org/apache/hadoop/mapreduce/lib/output/FileOutputFormat.java

@@ -150,7 +150,9 @@ public static final String OUTDIR = "mapreduce.output.fileoutputformat.outputdir
    * @param outputDir the {@link Path} of the output directory for 
    * @param outputDir the {@link Path} of the output directory for 
    * the map-reduce job.
    */
-  public static void setOutputPath(Job job, Path outputDir) {
+  public static void setOutputPath(Job job, Path outputDir) throws IOException {
+    outputDir = outputDir.getFileSystem(job.getConfiguration()).makeQualified(
+        outputDir);
     job.getConfiguration().set(FileOutputFormat.OUTDIR, outputDir.toString());
   }
 

+ 137 - 17
mapreduce/src/test/mapred/org/apache/hadoop/mapred/TestJobCounters.java

@@ -42,9 +42,10 @@ import org.apache.hadoop.io.Writable;
 import org.apache.hadoop.io.WritableComparable;
 import org.apache.hadoop.mapreduce.Cluster;
 import org.apache.hadoop.mapreduce.Job;
-import org.apache.hadoop.mapreduce.MRJobConfig;
 import org.apache.hadoop.mapreduce.TaskCounter;
 import org.apache.hadoop.mapreduce.TaskType;
+import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;
+import org.apache.hadoop.mapreduce.lib.output.FileOutputFormatCounter;
 
 /**
  * This is an wordcount application that tests the count of records
@@ -58,6 +59,26 @@ import org.apache.hadoop.mapreduce.TaskType;
  */
 public class TestJobCounters {
 
+  private void validateFileCounters(Counters counter, long fileBytesRead,
+      long fileBytesWritten, long mapOutputBytes,
+      long mapOutputMaterializedBytes) {
+    assertTrue(counter.findCounter(FileInputFormatCounter.BYTES_READ)
+        .getValue() != 0);
+    assertEquals(fileBytesRead,
+        counter.findCounter(FileInputFormatCounter.BYTES_READ).getValue());
+
+    assertTrue(counter.findCounter(FileOutputFormatCounter.BYTES_WRITTEN)
+        .getValue() != 0);
+
+    if (mapOutputBytes >= 0) {
+      assertTrue(counter.findCounter(TaskCounter.MAP_OUTPUT_BYTES).getValue() != 0);
+    }
+    if (mapOutputMaterializedBytes >= 0) {
+      assertTrue(counter.findCounter(TaskCounter.MAP_OUTPUT_MATERIALIZED_BYTES)
+          .getValue() != 0);
+    }
+  }
+
   private void validateCounters(Counters counter, long spillRecCnt,
                                 long mapInputRecords, long mapOutputRecords) {
       // Check if the numer of Spilled Records is same as expected
@@ -108,6 +129,19 @@ public class TestJobCounters {
   private static Path OUT_DIR = null;
   private static Path testdir = null;
 
+  private static Path[] inFiles = new Path[5];
+
+  private static long getFileSize(Path path) throws IOException {
+    FileSystem fs = FileSystem.getLocal(new Configuration());
+    long len = 0;
+    len += fs.getFileStatus(path).getLen();
+    Path crcPath = new Path(path.getParent(), "." + path.getName() + ".crc");
+    if (fs.exists(crcPath)) {
+      len += fs.getFileStatus(crcPath).getLen();
+    }
+    return len;
+  }
+
   @BeforeClass
   public static void initPaths() throws IOException {
     final Configuration conf = new Configuration();
@@ -125,11 +159,15 @@ public class TestJobCounters {
     if (!fs.mkdirs(IN_DIR)) {
       throw new IOException("Mkdirs failed to create " + IN_DIR);
     }
-    // create 3 input files each with 5*2k words
-    createWordsFile(new Path(IN_DIR, "input5_2k_1"), conf);
-    createWordsFile(new Path(IN_DIR, "input5_2k_2"), conf);
-    createWordsFile(new Path(IN_DIR, "input5_2k_3"), conf);
 
+    for (int i = 0; i < inFiles.length; i++) {
+      inFiles[i] = new Path(IN_DIR, "input5_2k_" + i);
+    }
+
+    // create 3 input files each with 5*2k words
+    createWordsFile(inFiles[0], conf);
+    createWordsFile(inFiles[1], conf);
+    createWordsFile(inFiles[2], conf);
   }
 
   @AfterClass
@@ -181,8 +219,12 @@ public class TestJobCounters {
     JobConf conf = createConfiguration();
     conf.setNumMapTasks(3);
     conf.setInt(JobContext.IO_SORT_FACTOR, 2);
-    removeWordsFile(new Path(IN_DIR, "input5_2k_4"), conf);
-    removeWordsFile(new Path(IN_DIR, "input5_2k_5"), conf);
+    removeWordsFile(inFiles[3], conf);
+    removeWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
     FileInputFormat.setInputPaths(conf, IN_DIR);
     FileOutputFormat.setOutputPath(conf, new Path(OUT_DIR, "outputO0"));
 
@@ -211,6 +253,7 @@ public class TestJobCounters {
     // 3 files, 5120 = 5 * 1024 rec/file = 15360 input records
     // 4 records/line = 61440 output records
     validateCounters(c1, 90112, 15360, 61440);
+    validateFileCounters(c1, inputSize, 0, 0, 0);
 
   }
 
@@ -218,8 +261,13 @@ public class TestJobCounters {
   public void testOldCounterB() throws Exception {
 
     JobConf conf = createConfiguration();
-    createWordsFile(new Path(IN_DIR, "input5_2k_4"), conf);
-    removeWordsFile(new Path(IN_DIR, "input5_2k_5"), conf);
+    createWordsFile(inFiles[3], conf);
+    removeWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
+    inputSize += getFileSize(inFiles[3]);
     conf.setNumMapTasks(4);
     conf.setInt(JobContext.IO_SORT_FACTOR, 2);
     FileInputFormat.setInputPaths(conf, IN_DIR);
@@ -239,13 +287,20 @@ public class TestJobCounters {
     // 4 files, 5120 = 5 * 1024 rec/file = 15360 input records
     // 4 records/line = 81920 output records
     validateCounters(c1, 131072, 20480, 81920);
+    validateFileCounters(c1, inputSize, 0, 0, 0);
   }
 
   @Test
   public void testOldCounterC() throws Exception {
     JobConf conf = createConfiguration();
-    createWordsFile(new Path(IN_DIR, "input5_2k_4"), conf);
-    createWordsFile(new Path(IN_DIR, "input5_2k_5"), conf);
+    createWordsFile(inFiles[3], conf);
+    createWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
+    inputSize += getFileSize(inFiles[3]);
+    inputSize += getFileSize(inFiles[4]);
     conf.setNumMapTasks(4);
     conf.setInt(JobContext.IO_SORT_FACTOR, 3);
     FileInputFormat.setInputPaths(conf, IN_DIR);
@@ -260,6 +315,31 @@ public class TestJobCounters {
     // 5 files, 5120 = 5 * 1024 rec/file = 15360 input records
     // 4 records/line = 102400 output records
     validateCounters(c1, 147456, 25600, 102400);
+    validateFileCounters(c1, inputSize, 0, 0, 0);
+  }
+
+  @Test
+  public void testOldCounterD() throws Exception {
+    JobConf conf = createConfiguration();
+    conf.setNumMapTasks(3);
+    conf.setInt(JobContext.IO_SORT_FACTOR, 2);
+    conf.setNumReduceTasks(0);
+    removeWordsFile(inFiles[3], conf);
+    removeWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
+    FileInputFormat.setInputPaths(conf, IN_DIR);
+    FileOutputFormat.setOutputPath(conf, new Path(OUT_DIR, "outputO3"));
+
+    RunningJob myJob = JobClient.runJob(conf);
+    Counters c1 = myJob.getCounters();
+
+    // No Reduces. Will go through the direct output collector. Spills=0
+
+    validateCounters(c1, 0, 15360, 61440);
+    validateFileCounters(c1, inputSize, 0, -1, -1);
   }
 
   @Test
@@ -267,8 +347,12 @@ public class TestJobCounters {
     final Job job = createJob();
     final Configuration conf = job.getConfiguration();
     conf.setInt(JobContext.IO_SORT_FACTOR, 2);
-    removeWordsFile(new Path(IN_DIR, "input5_2k_4"), conf);
-    removeWordsFile(new Path(IN_DIR, "input5_2k_5"), conf);
+    removeWordsFile(inFiles[3], conf);
+    removeWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
     org.apache.hadoop.mapreduce.lib.input.FileInputFormat.setInputPaths(
         job, IN_DIR);
     org.apache.hadoop.mapreduce.lib.output.FileOutputFormat.setOutputPath(
@@ -276,6 +360,7 @@ public class TestJobCounters {
     assertTrue(job.waitForCompletion(true));
     final Counters c1 = Counters.downgrade(job.getCounters());
     validateCounters(c1, 90112, 15360, 61440);
+    validateFileCounters(c1, inputSize, 0, 0, 0);    
   }
 
   @Test
@@ -283,8 +368,13 @@ public class TestJobCounters {
     final Job job = createJob();
     final Configuration conf = job.getConfiguration();
     conf.setInt(JobContext.IO_SORT_FACTOR, 2);
-    createWordsFile(new Path(IN_DIR, "input5_2k_4"), conf);
-    removeWordsFile(new Path(IN_DIR, "input5_2k_5"), conf);
+    createWordsFile(inFiles[3], conf);
+    removeWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
+    inputSize += getFileSize(inFiles[3]);
     org.apache.hadoop.mapreduce.lib.input.FileInputFormat.setInputPaths(
         job, IN_DIR);
     org.apache.hadoop.mapreduce.lib.output.FileOutputFormat.setOutputPath(
@@ -292,6 +382,7 @@ public class TestJobCounters {
     assertTrue(job.waitForCompletion(true));
     final Counters c1 = Counters.downgrade(job.getCounters());
     validateCounters(c1, 131072, 20480, 81920);
+    validateFileCounters(c1, inputSize, 0, 0, 0);
   }
 
   @Test
@@ -299,8 +390,14 @@ public class TestJobCounters {
     final Job job = createJob();
     final Configuration conf = job.getConfiguration();
     conf.setInt(JobContext.IO_SORT_FACTOR, 3);
-    createWordsFile(new Path(IN_DIR, "input5_2k_4"), conf);
-    createWordsFile(new Path(IN_DIR, "input5_2k_5"), conf);
+    createWordsFile(inFiles[3], conf);
+    createWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
+    inputSize += getFileSize(inFiles[3]);
+    inputSize += getFileSize(inFiles[4]);
     org.apache.hadoop.mapreduce.lib.input.FileInputFormat.setInputPaths(
         job, IN_DIR);
     org.apache.hadoop.mapreduce.lib.output.FileOutputFormat.setOutputPath(
@@ -308,6 +405,29 @@ public class TestJobCounters {
     assertTrue(job.waitForCompletion(true));
     final Counters c1 = Counters.downgrade(job.getCounters());
     validateCounters(c1, 147456, 25600, 102400);
+    validateFileCounters(c1, inputSize, 0, 0, 0);
+  }
+
+  @Test
+  public void testNewCounterD() throws Exception {
+    final Job job = createJob();
+    final Configuration conf = job.getConfiguration();
+    conf.setInt(JobContext.IO_SORT_FACTOR, 2);
+    job.setNumReduceTasks(0);
+    removeWordsFile(inFiles[3], conf);
+    removeWordsFile(inFiles[4], conf);
+    long inputSize = 0;
+    inputSize += getFileSize(inFiles[0]);
+    inputSize += getFileSize(inFiles[1]);
+    inputSize += getFileSize(inFiles[2]);
+    org.apache.hadoop.mapreduce.lib.input.FileInputFormat.setInputPaths(job,
+        IN_DIR);
+    org.apache.hadoop.mapreduce.lib.output.FileOutputFormat.setOutputPath(job,
+        new Path(OUT_DIR, "outputN3"));
+    assertTrue(job.waitForCompletion(true));
+    final Counters c1 = Counters.downgrade(job.getCounters());
+    validateCounters(c1, 0, 15360, 61440);
+    validateFileCounters(c1, inputSize, 0, -1, -1);
   }
 
   /** 

+ 3 - 4
mapreduce/src/test/mapred/org/apache/hadoop/mapred/TestMiniMRDFSSort.java

@@ -34,6 +34,7 @@ import org.apache.hadoop.io.Text;
 import org.apache.hadoop.mapred.lib.IdentityMapper;
 import org.apache.hadoop.mapred.lib.IdentityReducer;
 import org.apache.hadoop.mapred.lib.NullOutputFormat;
+import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
 import org.apache.hadoop.util.ToolRunner;
@@ -101,10 +102,8 @@ public class TestMiniMRDFSSort extends TestCase {
     Sort sort = new Sort();
     assertEquals(ToolRunner.run(job, sort, sortArgs), 0);
     org.apache.hadoop.mapreduce.Counters counters = sort.getResult().getCounters();
-    long mapInput = counters.findCounter(
-      org.apache.hadoop.mapreduce.lib.input.FileInputFormat.COUNTER_GROUP,
-      org.apache.hadoop.mapreduce.lib.input.FileInputFormat.BYTES_READ).
-      getValue();
+    long mapInput = counters.findCounter(FileInputFormatCounter.BYTES_READ)
+        .getValue();
     long hdfsRead = counters.findCounter(Task.FILESYSTEM_COUNTER_GROUP,
                                          "HDFS_BYTES_READ").getValue();
     // the hdfs read should be between 100% and 110% of the map input bytes

+ 2 - 2
mapreduce/src/test/mapred/org/apache/hadoop/mapreduce/TestMapReduceLocal.java

@@ -38,6 +38,7 @@ import org.apache.hadoop.io.LongWritable;
 import org.apache.hadoop.io.Text;
 import org.apache.hadoop.mapred.MiniMRCluster;
 import org.apache.hadoop.mapreduce.lib.input.FileInputFormat;
+import org.apache.hadoop.mapreduce.lib.input.FileInputFormatCounter;
 import org.apache.hadoop.mapreduce.lib.input.LineRecordReader;
 import org.apache.hadoop.mapreduce.lib.input.TextInputFormat;
 import org.apache.hadoop.mapreduce.lib.output.FileOutputFormat;
@@ -147,8 +148,7 @@ public class TestMapReduceLocal extends TestCase {
                  out);
     Counters ctrs = job.getCounters();
     System.out.println("Counters: " + ctrs);
-    long mapIn = ctrs.findCounter(FileInputFormat.COUNTER_GROUP, 
-                                  FileInputFormat.BYTES_READ).getValue();
+    long mapIn = ctrs.findCounter(FileInputFormatCounter.BYTES_READ).getValue();
     assertTrue(mapIn != 0);    
     long combineIn = ctrs.findCounter(COUNTER_GROUP,
                                       "COMBINE_INPUT_RECORDS").getValue();