|
@@ -0,0 +1,284 @@
|
|
|
+/**
|
|
|
+ * Licensed to the Apache Software Foundation (ASF) under one
|
|
|
+ * or more contributor license agreements. See the NOTICE file
|
|
|
+ * distributed with this work for additional information
|
|
|
+ * regarding copyright ownership. The ASF licenses this file
|
|
|
+ * to you under the Apache License, Version 2.0 (the
|
|
|
+ * "License"); you may not use this file except in compliance
|
|
|
+ * with the License. You may obtain a copy of the License at
|
|
|
+ *
|
|
|
+ * http://www.apache.org/licenses/LICENSE-2.0
|
|
|
+ *
|
|
|
+ * Unless required by applicable law or agreed to in writing, software
|
|
|
+ * distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
+ * See the License for the specific language governing permissions and
|
|
|
+ * limitations under the License.
|
|
|
+ */
|
|
|
+
|
|
|
+package org.apache.hadoop.mapred;
|
|
|
+
|
|
|
+import java.io.File;
|
|
|
+import java.io.FileInputStream;
|
|
|
+import java.io.IOException;
|
|
|
+import java.net.URI;
|
|
|
+
|
|
|
+import junit.framework.TestCase;
|
|
|
+
|
|
|
+import org.apache.hadoop.fs.FileSystem;
|
|
|
+import org.apache.hadoop.fs.FileUtil;
|
|
|
+import org.apache.hadoop.fs.Path;
|
|
|
+import org.apache.hadoop.fs.RawLocalFileSystem;
|
|
|
+import org.apache.hadoop.io.NullWritable;
|
|
|
+import org.apache.hadoop.io.Text;
|
|
|
+
|
|
|
+@SuppressWarnings("unchecked")
|
|
|
+public class TestFileOutputCommitter extends TestCase {
|
|
|
+ private static Path outDir = new Path(System.getProperty("test.build.data",
|
|
|
+ "/tmp"), "output");
|
|
|
+
|
|
|
+ // A random task attempt id for testing.
|
|
|
+ private static String attempt = "attempt_200707121733_0001_m_000000_0";
|
|
|
+ private static String partFile = "part-00000";
|
|
|
+ private static TaskAttemptID taskID = TaskAttemptID.forName(attempt);
|
|
|
+ private Text key1 = new Text("key1");
|
|
|
+ private Text key2 = new Text("key2");
|
|
|
+ private Text val1 = new Text("val1");
|
|
|
+ private Text val2 = new Text("val2");
|
|
|
+
|
|
|
+
|
|
|
+ private void writeOutput(RecordWriter theRecordWriter,
|
|
|
+ TaskAttemptContext context) throws IOException, InterruptedException {
|
|
|
+ NullWritable nullWritable = NullWritable.get();
|
|
|
+
|
|
|
+ try {
|
|
|
+ theRecordWriter.write(key1, val1);
|
|
|
+ theRecordWriter.write(null, nullWritable);
|
|
|
+ theRecordWriter.write(null, val1);
|
|
|
+ theRecordWriter.write(nullWritable, val2);
|
|
|
+ theRecordWriter.write(key2, nullWritable);
|
|
|
+ theRecordWriter.write(key1, null);
|
|
|
+ theRecordWriter.write(null, null);
|
|
|
+ theRecordWriter.write(key2, val2);
|
|
|
+ } finally {
|
|
|
+ theRecordWriter.close(null);
|
|
|
+ }
|
|
|
+ }
|
|
|
+
|
|
|
+
|
|
|
+ public void testRecovery() throws Exception {
|
|
|
+ JobConf conf = new JobConf();
|
|
|
+ FileOutputFormat.setOutputPath(conf, outDir);
|
|
|
+ conf.set(JobContext.TASK_ATTEMPT_ID, attempt);
|
|
|
+ conf.setInt(MRConstants.APPLICATION_ATTEMPT_ID, 1);
|
|
|
+ JobContext jContext = new JobContextImpl(conf, taskID.getJobID());
|
|
|
+ TaskAttemptContext tContext = new TaskAttemptContextImpl(conf, taskID);
|
|
|
+ FileOutputCommitter committer = new FileOutputCommitter();
|
|
|
+
|
|
|
+ // setup
|
|
|
+ committer.setupJob(jContext);
|
|
|
+ committer.setupTask(tContext);
|
|
|
+
|
|
|
+ // write output
|
|
|
+ TextOutputFormat theOutputFormat = new TextOutputFormat();
|
|
|
+ RecordWriter theRecordWriter =
|
|
|
+ theOutputFormat.getRecordWriter(null, conf, partFile, null);
|
|
|
+ writeOutput(theRecordWriter, tContext);
|
|
|
+
|
|
|
+ // do commit
|
|
|
+ committer.commitTask(tContext);
|
|
|
+ Path jobTempDir1 = new Path(outDir,
|
|
|
+ FileOutputCommitter.getJobAttemptBaseDirName(
|
|
|
+ conf.getInt(MRConstants.APPLICATION_ATTEMPT_ID, 0)));
|
|
|
+ assertTrue((new File(jobTempDir1.toString()).exists()));
|
|
|
+ validateContent(jobTempDir1);
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+ //now while running the second app attempt,
|
|
|
+ //recover the task output from first attempt
|
|
|
+ JobConf conf2 = new JobConf(conf);
|
|
|
+ conf2.set(JobContext.TASK_ATTEMPT_ID, attempt);
|
|
|
+ conf2.setInt(MRConstants.APPLICATION_ATTEMPT_ID, 2);
|
|
|
+ JobContext jContext2 = new JobContextImpl(conf2, taskID.getJobID());
|
|
|
+ TaskAttemptContext tContext2 = new TaskAttemptContextImpl(conf2, taskID);
|
|
|
+ FileOutputCommitter committer2 = new FileOutputCommitter();
|
|
|
+ committer.setupJob(jContext2);
|
|
|
+ Path jobTempDir2 = new Path(outDir,
|
|
|
+ FileOutputCommitter.getJobAttemptBaseDirName(
|
|
|
+ conf2.getInt(MRConstants.APPLICATION_ATTEMPT_ID, 0)));
|
|
|
+ assertTrue((new File(jobTempDir2.toString()).exists()));
|
|
|
+
|
|
|
+ tContext2.getConfiguration().setInt(MRConstants.APPLICATION_ATTEMPT_ID, 2);
|
|
|
+ committer2.recoverTask(tContext2);
|
|
|
+ validateContent(jobTempDir2);
|
|
|
+
|
|
|
+ committer2.commitJob(jContext2);
|
|
|
+ validateContent(outDir);
|
|
|
+ FileUtil.fullyDelete(new File(outDir.toString()));
|
|
|
+ }
|
|
|
+
|
|
|
+ private void validateContent(Path dir) throws IOException {
|
|
|
+ File expectedFile = new File(new Path(dir, partFile).toString());
|
|
|
+ StringBuffer expectedOutput = new StringBuffer();
|
|
|
+ expectedOutput.append(key1).append('\t').append(val1).append("\n");
|
|
|
+ expectedOutput.append(val1).append("\n");
|
|
|
+ expectedOutput.append(val2).append("\n");
|
|
|
+ expectedOutput.append(key2).append("\n");
|
|
|
+ expectedOutput.append(key1).append("\n");
|
|
|
+ expectedOutput.append(key2).append('\t').append(val2).append("\n");
|
|
|
+ String output = slurp(expectedFile);
|
|
|
+ assertEquals(output, expectedOutput.toString());
|
|
|
+ }
|
|
|
+
|
|
|
+
|
|
|
+ public void testCommitter() throws Exception {
|
|
|
+ JobConf conf = new JobConf();
|
|
|
+ FileOutputFormat.setOutputPath(conf, outDir);
|
|
|
+ conf.set(JobContext.TASK_ATTEMPT_ID, attempt);
|
|
|
+ JobContext jContext = new JobContextImpl(conf, taskID.getJobID());
|
|
|
+ TaskAttemptContext tContext = new TaskAttemptContextImpl(conf, taskID);
|
|
|
+ FileOutputCommitter committer = new FileOutputCommitter();
|
|
|
+
|
|
|
+ // setup
|
|
|
+ committer.setupJob(jContext);
|
|
|
+ committer.setupTask(tContext);
|
|
|
+
|
|
|
+ // write output
|
|
|
+ TextOutputFormat theOutputFormat = new TextOutputFormat();
|
|
|
+ RecordWriter theRecordWriter =
|
|
|
+ theOutputFormat.getRecordWriter(null, conf, partFile, null);
|
|
|
+ writeOutput(theRecordWriter, tContext);
|
|
|
+
|
|
|
+ // do commit
|
|
|
+ committer.commitTask(tContext);
|
|
|
+ committer.commitJob(jContext);
|
|
|
+
|
|
|
+ // validate output
|
|
|
+ validateContent(outDir);
|
|
|
+ FileUtil.fullyDelete(new File(outDir.toString()));
|
|
|
+ }
|
|
|
+
|
|
|
+
|
|
|
+ public void testAbort() throws IOException, InterruptedException {
|
|
|
+ JobConf conf = new JobConf();
|
|
|
+ FileOutputFormat.setOutputPath(conf, outDir);
|
|
|
+ conf.set(JobContext.TASK_ATTEMPT_ID, attempt);
|
|
|
+ JobContext jContext = new JobContextImpl(conf, taskID.getJobID());
|
|
|
+ TaskAttemptContext tContext = new TaskAttemptContextImpl(conf, taskID);
|
|
|
+ FileOutputCommitter committer = new FileOutputCommitter();
|
|
|
+
|
|
|
+ // do setup
|
|
|
+ committer.setupJob(jContext);
|
|
|
+ committer.setupTask(tContext);
|
|
|
+
|
|
|
+ // write output
|
|
|
+ TextOutputFormat theOutputFormat = new TextOutputFormat();
|
|
|
+ RecordWriter theRecordWriter =
|
|
|
+ theOutputFormat.getRecordWriter(null, conf, partFile, null);
|
|
|
+ writeOutput(theRecordWriter, tContext);
|
|
|
+
|
|
|
+ // do abort
|
|
|
+ committer.abortTask(tContext);
|
|
|
+ FileSystem outputFileSystem = outDir.getFileSystem(conf);
|
|
|
+ Path workPath = new Path(outDir,
|
|
|
+ committer.getTaskAttemptBaseDirName(tContext))
|
|
|
+ .makeQualified(outputFileSystem);
|
|
|
+ File expectedFile = new File(new Path(workPath, partFile)
|
|
|
+ .toString());
|
|
|
+ assertFalse("task temp dir still exists", expectedFile.exists());
|
|
|
+
|
|
|
+ committer.abortJob(jContext, JobStatus.State.FAILED);
|
|
|
+ expectedFile = new File(new Path(outDir, FileOutputCommitter.TEMP_DIR_NAME)
|
|
|
+ .toString());
|
|
|
+ assertFalse("job temp dir still exists", expectedFile.exists());
|
|
|
+ assertEquals("Output directory not empty", 0, new File(outDir.toString())
|
|
|
+ .listFiles().length);
|
|
|
+ FileUtil.fullyDelete(new File(outDir.toString()));
|
|
|
+ }
|
|
|
+
|
|
|
+ public static class FakeFileSystem extends RawLocalFileSystem {
|
|
|
+ public FakeFileSystem() {
|
|
|
+ super();
|
|
|
+ }
|
|
|
+
|
|
|
+ public URI getUri() {
|
|
|
+ return URI.create("faildel:///");
|
|
|
+ }
|
|
|
+
|
|
|
+ @Override
|
|
|
+ public boolean delete(Path p, boolean recursive) throws IOException {
|
|
|
+ throw new IOException("fake delete failed");
|
|
|
+ }
|
|
|
+ }
|
|
|
+
|
|
|
+
|
|
|
+ public void testFailAbort() throws IOException, InterruptedException {
|
|
|
+ JobConf conf = new JobConf();
|
|
|
+ conf.set(FileSystem.FS_DEFAULT_NAME_KEY, "faildel:///");
|
|
|
+ conf.setClass("fs.faildel.impl", FakeFileSystem.class, FileSystem.class);
|
|
|
+ conf.set(JobContext.TASK_ATTEMPT_ID, attempt);
|
|
|
+ conf.setInt(MRConstants.APPLICATION_ATTEMPT_ID, 1);
|
|
|
+ FileOutputFormat.setOutputPath(conf, outDir);
|
|
|
+ JobContext jContext = new JobContextImpl(conf, taskID.getJobID());
|
|
|
+ TaskAttemptContext tContext = new TaskAttemptContextImpl(conf, taskID);
|
|
|
+ FileOutputCommitter committer = new FileOutputCommitter();
|
|
|
+
|
|
|
+ // do setup
|
|
|
+ committer.setupJob(jContext);
|
|
|
+ committer.setupTask(tContext);
|
|
|
+
|
|
|
+ // write output
|
|
|
+ File jobTmpDir = new File(new Path(outDir,
|
|
|
+ FileOutputCommitter.TEMP_DIR_NAME + Path.SEPARATOR +
|
|
|
+ conf.getInt(MRConstants.APPLICATION_ATTEMPT_ID, 0) +
|
|
|
+ Path.SEPARATOR +
|
|
|
+ FileOutputCommitter.TEMP_DIR_NAME).toString());
|
|
|
+ File taskTmpDir = new File(jobTmpDir, "_" + taskID);
|
|
|
+ File expectedFile = new File(taskTmpDir, partFile);
|
|
|
+ TextOutputFormat<?, ?> theOutputFormat = new TextOutputFormat();
|
|
|
+ RecordWriter<?, ?> theRecordWriter =
|
|
|
+ theOutputFormat.getRecordWriter(null, conf,
|
|
|
+ expectedFile.getAbsolutePath(), null);
|
|
|
+ writeOutput(theRecordWriter, tContext);
|
|
|
+
|
|
|
+ // do abort
|
|
|
+ Throwable th = null;
|
|
|
+ try {
|
|
|
+ committer.abortTask(tContext);
|
|
|
+ } catch (IOException ie) {
|
|
|
+ th = ie;
|
|
|
+ }
|
|
|
+ assertNotNull(th);
|
|
|
+ assertTrue(th instanceof IOException);
|
|
|
+ assertTrue(th.getMessage().contains("fake delete failed"));
|
|
|
+ assertTrue(expectedFile + " does not exists", expectedFile.exists());
|
|
|
+
|
|
|
+ th = null;
|
|
|
+ try {
|
|
|
+ committer.abortJob(jContext, JobStatus.State.FAILED);
|
|
|
+ } catch (IOException ie) {
|
|
|
+ th = ie;
|
|
|
+ }
|
|
|
+ assertNotNull(th);
|
|
|
+ assertTrue(th instanceof IOException);
|
|
|
+ assertTrue(th.getMessage().contains("fake delete failed"));
|
|
|
+ assertTrue("job temp dir does not exists", jobTmpDir.exists());
|
|
|
+ FileUtil.fullyDelete(new File(outDir.toString()));
|
|
|
+ }
|
|
|
+
|
|
|
+ public static String slurp(File f) throws IOException {
|
|
|
+ int len = (int) f.length();
|
|
|
+ byte[] buf = new byte[len];
|
|
|
+ FileInputStream in = new FileInputStream(f);
|
|
|
+ String contents = null;
|
|
|
+ try {
|
|
|
+ in.read(buf, 0, len);
|
|
|
+ contents = new String(buf, "UTF-8");
|
|
|
+ } finally {
|
|
|
+ in.close();
|
|
|
+ }
|
|
|
+ return contents;
|
|
|
+ }
|
|
|
+
|
|
|
+}
|