|
@@ -0,0 +1,159 @@
|
|
|
|
+/**
|
|
|
|
+ * Licensed to the Apache Software Foundation (ASF) under one
|
|
|
|
+ * or more contributor license agreements. See the NOTICE file
|
|
|
|
+ * distributed with this work for additional information
|
|
|
|
+ * regarding copyright ownership. The ASF licenses this file
|
|
|
|
+ * to you under the Apache License, Version 2.0 (the
|
|
|
|
+ * "License"); you may not use this file except in compliance
|
|
|
|
+ * with the License. You may obtain a copy of the License at
|
|
|
|
+ *
|
|
|
|
+ * http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
+ *
|
|
|
|
+ * Unless required by applicable law or agreed to in writing, software
|
|
|
|
+ * distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
+ * See the License for the specific language governing permissions and
|
|
|
|
+ * limitations under the License.
|
|
|
|
+ */
|
|
|
|
+
|
|
|
|
+package org.apache.hadoop.hdfs.server.namenode;
|
|
|
|
+
|
|
|
|
+import java.io.IOException;
|
|
|
|
+
|
|
|
|
+import org.apache.commons.logging.Log;
|
|
|
|
+import org.apache.commons.logging.LogFactory;
|
|
|
|
+import org.apache.hadoop.conf.Configuration;
|
|
|
|
+import org.apache.hadoop.fs.Path;
|
|
|
|
+import org.apache.hadoop.hdfs.protocol.FSConstants.SafeModeAction;
|
|
|
|
+import org.apache.hadoop.hdfs.DFSConfigKeys;
|
|
|
|
+import org.apache.hadoop.hdfs.DistributedFileSystem;
|
|
|
|
+import org.apache.hadoop.hdfs.HdfsConfiguration;
|
|
|
|
+import org.apache.hadoop.hdfs.MiniDFSCluster;
|
|
|
|
+import org.apache.hadoop.hdfs.DFSTestUtil;
|
|
|
|
+import junit.framework.TestCase;
|
|
|
|
+
|
|
|
|
+/**
|
|
|
|
+ * Tests to verify safe mode correctness.
|
|
|
|
+ */
|
|
|
|
+public class TestSafeMode extends TestCase {
|
|
|
|
+
|
|
|
|
+ static Log LOG = LogFactory.getLog(TestSafeMode.class);
|
|
|
|
+
|
|
|
|
+ /**
|
|
|
|
+ * This test verifies that if SafeMode is manually entered, name-node does not
|
|
|
|
+ * come out of safe mode even after the startup safe mode conditions are met.
|
|
|
|
+ * <ol>
|
|
|
|
+ * <li>Start cluster with 1 data-node.</li>
|
|
|
|
+ * <li>Create 2 files with replication 1.</li>
|
|
|
|
+ * <li>Re-start cluster with 0 data-nodes.
|
|
|
|
+ * Name-node should stay in automatic safe-mode.</li>
|
|
|
|
+ * <li>Enter safe mode manually.</li>
|
|
|
|
+ * <li>Start the data-node.</li>
|
|
|
|
+ * <li>Wait longer than <tt>dfs.safemode.extension</tt> and
|
|
|
|
+ * verify that the name-node is still in safe mode.</li>
|
|
|
|
+ * </ol>
|
|
|
|
+ *
|
|
|
|
+ * @throws IOException
|
|
|
|
+ */
|
|
|
|
+ public void testManualSafeMode() throws IOException {
|
|
|
|
+ MiniDFSCluster cluster = null;
|
|
|
|
+ DistributedFileSystem fs = null;
|
|
|
|
+ try {
|
|
|
|
+ Configuration conf = new HdfsConfiguration();
|
|
|
|
+ // disable safemode extension to make the test run faster.
|
|
|
|
+ conf.set(DFSConfigKeys.DFS_NAMENODE_SAFEMODE_EXTENSION_KEY, "1");
|
|
|
|
+ cluster = new MiniDFSCluster.Builder(conf).build();
|
|
|
|
+ cluster.waitActive();
|
|
|
|
+
|
|
|
|
+ fs = (DistributedFileSystem)cluster.getFileSystem();
|
|
|
|
+ Path file1 = new Path("/tmp/testManualSafeMode/file1");
|
|
|
|
+ Path file2 = new Path("/tmp/testManualSafeMode/file2");
|
|
|
|
+
|
|
|
|
+ LOG.info("Created file1 and file2.");
|
|
|
|
+
|
|
|
|
+ // create two files with one block each.
|
|
|
|
+ DFSTestUtil.createFile(fs, file1, 1000, (short)1, 0);
|
|
|
|
+ DFSTestUtil.createFile(fs, file2, 2000, (short)1, 0);
|
|
|
|
+ fs.close();
|
|
|
|
+ cluster.shutdown();
|
|
|
|
+
|
|
|
|
+ // now bring up just the NameNode.
|
|
|
|
+ cluster = new MiniDFSCluster.Builder(conf).numDataNodes(0).format(false).build();
|
|
|
|
+ cluster.waitActive();
|
|
|
|
+ fs = (DistributedFileSystem)cluster.getFileSystem();
|
|
|
|
+
|
|
|
|
+ LOG.info("Restarted cluster with just the NameNode");
|
|
|
|
+
|
|
|
|
+ assertTrue("No datanode is started. Should be in SafeMode",
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_GET));
|
|
|
|
+
|
|
|
|
+ // manually set safemode.
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_ENTER);
|
|
|
|
+
|
|
|
|
+ // now bring up the datanode and wait for it to be active.
|
|
|
|
+ cluster.startDataNodes(conf, 1, true, null, null);
|
|
|
|
+ cluster.waitActive();
|
|
|
|
+
|
|
|
|
+ LOG.info("Datanode is started.");
|
|
|
|
+
|
|
|
|
+ // wait longer than dfs.safemode.extension
|
|
|
|
+ try {
|
|
|
|
+ Thread.sleep(2000);
|
|
|
|
+ } catch (InterruptedException ignored) {}
|
|
|
|
+
|
|
|
|
+ assertTrue("should still be in SafeMode",
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_GET));
|
|
|
|
+
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_LEAVE);
|
|
|
|
+ assertFalse("should not be in SafeMode",
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_GET));
|
|
|
|
+ } finally {
|
|
|
|
+ if(fs != null) fs.close();
|
|
|
|
+ if(cluster!= null) cluster.shutdown();
|
|
|
|
+ }
|
|
|
|
+ }
|
|
|
|
+
|
|
|
|
+
|
|
|
|
+ /**
|
|
|
|
+ * Verify that the NameNode stays in safemode when dfs.safemode.datanode.min
|
|
|
|
+ * is set to a number greater than the number of live datanodes.
|
|
|
|
+ */
|
|
|
|
+ public void testDatanodeThreshold() throws IOException {
|
|
|
|
+ MiniDFSCluster cluster = null;
|
|
|
|
+ DistributedFileSystem fs = null;
|
|
|
|
+ try {
|
|
|
|
+ Configuration conf = new Configuration();
|
|
|
|
+ conf.setInt(DFSConfigKeys.DFS_NAMENODE_SAFEMODE_EXTENSION_KEY, 0);
|
|
|
|
+ conf.setInt(DFSConfigKeys.DFS_NAMENODE_SAFEMODE_MIN_DATANODES_KEY, 1);
|
|
|
|
+
|
|
|
|
+ // bring up a cluster with no datanodes
|
|
|
|
+ cluster = new MiniDFSCluster.Builder(conf).numDataNodes(0).format(true).build();
|
|
|
|
+ cluster.waitActive();
|
|
|
|
+ fs = (DistributedFileSystem)cluster.getFileSystem();
|
|
|
|
+
|
|
|
|
+ assertTrue("No datanode started, but we require one - safemode expected",
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_GET));
|
|
|
|
+
|
|
|
|
+ String tipMsg = cluster.getNamesystem().getSafeModeTip();
|
|
|
|
+ assertTrue("Safemode tip message looks right",
|
|
|
|
+ tipMsg.contains("The number of live datanodes 0 needs an " +
|
|
|
|
+ "additional 1 live"));
|
|
|
|
+
|
|
|
|
+ // Start a datanode
|
|
|
|
+ cluster.startDataNodes(conf, 1, true, null, null);
|
|
|
|
+
|
|
|
|
+ // Wait long enough for safemode check to refire
|
|
|
|
+ try {
|
|
|
|
+ Thread.sleep(1000);
|
|
|
|
+ } catch (InterruptedException ignored) {}
|
|
|
|
+
|
|
|
|
+ // We now should be out of safe mode.
|
|
|
|
+ assertFalse(
|
|
|
|
+ "Out of safe mode after starting datanode.",
|
|
|
|
+ fs.setSafeMode(SafeModeAction.SAFEMODE_GET));
|
|
|
|
+ } finally {
|
|
|
|
+ if (fs != null) fs.close();
|
|
|
|
+ if (cluster != null) cluster.shutdown();
|
|
|
|
+ }
|
|
|
|
+ }
|
|
|
|
+}
|