Browse Source

MAPREDUCE-6366. mapreduce.terasort.final.sync configuration in TeraSort doesn't work. Contributed by Takuya Fukudome.

Tsuyoshi Ozawa 10 years ago
parent: (hash not captured)
commit: e82067bfe6

+3 -0 (3 additions, 0 deletions)
hadoop-mapreduce-project/CHANGES.txt

@@ -419,6 +419,9 @@ Release 2.8.0 - UNRELEASED
     copySucceeded() in one thread and copyFailed() in another thread on the
     same host. (Junping Du via ozawa)
 
+    MAPREDUCE-6366. mapreduce.terasort.final.sync configuration in TeraSort
+    doesn't work. (Takuya Fukudome via ozawa)
+
 Release 2.7.1 - UNRELEASED
 
   INCOMPATIBLE CHANGES

+0 -1 (0 additions, 1 deletion)
hadoop-mapreduce-project/hadoop-mapreduce-examples/src/main/java/org/apache/hadoop/examples/terasort/TeraSort.java

@@ -328,7 +328,6 @@ public class TeraSort extends Configured implements Tool {
     }
     
     job.getConfiguration().setInt("dfs.replication", getOutputReplication(job));
-    TeraOutputFormat.setFinalSync(job, true);
     int ret = job.waitForCompletion(true) ? 0 : 1;
     LOG.info("done");
     return ret;

+1 -1 (1 addition, 1 deletion)
hadoop-mapreduce-project/hadoop-mapreduce-examples/src/main/java/org/apache/hadoop/examples/terasort/TeraSortConfigKeys.java

@@ -70,7 +70,7 @@ public enum TeraSortConfigKeys {
   public static final long DEFAULT_NUM_ROWS = 0L;
   public static final int DEFAULT_NUM_PARTITIONS = 10;
   public static final long DEFAULT_SAMPLE_SIZE = 100000L;
-  public static final boolean DEFAULT_FINAL_SYNC_ATTRIBUTE = false;
+  public static final boolean DEFAULT_FINAL_SYNC_ATTRIBUTE = true;
   public static final boolean DEFAULT_USE_TERA_SCHEDULER = true;
   public static final boolean DEFAULT_USE_SIMPLE_PARTITIONER = false;
   public static final int DEFAULT_OUTPUT_REPLICATION = 1;