|
@@ -1,3 +1,4 @@
|
|
|
+
|
|
|
<!---
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
you may not use this file except in compliance with the License.
|
|
@@ -852,40 +853,361 @@ Seoul
|
|
|
If the wrong endpoint is used, the request may fail. This may be reported as a 301/redirect error,
|
|
|
or as a 400 Bad Request.
|
|
|
|
|
|
-### S3AFastOutputStream
|
|
|
- **Warning: NEW in hadoop 2.7. UNSTABLE, EXPERIMENTAL: use at own risk**
|
|
|
|
|
|
- <property>
|
|
|
- <name>fs.s3a.fast.upload</name>
|
|
|
- <value>false</value>
|
|
|
- <description>Upload directly from memory instead of buffering to
|
|
|
- disk first. Memory usage and parallelism can be controlled as up to
|
|
|
- fs.s3a.multipart.size memory is consumed for each (part)upload actively
|
|
|
- uploading (fs.s3a.threads.max) or queueing (fs.s3a.max.total.tasks)</description>
|
|
|
- </property>
|
|
|
|
|
|
- <property>
|
|
|
- <name>fs.s3a.fast.buffer.size</name>
|
|
|
- <value>1048576</value>
|
|
|
- <description>Size (in bytes) of initial memory buffer allocated for an
|
|
|
- upload. No effect if fs.s3a.fast.upload is false.</description>
|
|
|
- </property>
|
|
|
+### <a name="s3a_fast_upload"></a>Stabilizing: S3A Fast Upload
|
|
|
+
|
|
|
+
|
|
|
+**New in Hadoop 2.7; significantly enhanced in Hadoop 2.9**
|
|
|
+
|
|
|
+
|
|
|
+Because of the nature of the S3 object store, data written to an S3A `OutputStream`
|
|
|
+is not written incrementally —instead, by default, it is buffered to disk
|
|
|
+until the stream's `close()` method is called.
|
|
|
+
|
|
|
+This can make output slow:
|
|
|
+
|
|
|
+* The execution time for `OutputStream.close()` is proportional to the amount of data
+buffered and inversely proportional to the bandwidth. That is `O(data/bandwidth)`
+(see the worked example after this list).
|
|
|
+* The bandwidth is that available from the host to S3: other work in the same
|
|
|
+process, server or network at the time of upload may increase the upload time,
|
|
|
+hence the duration of the `close()` call.
|
|
|
+* If a process uploading data fails before `OutputStream.close()` is called,
|
|
|
+all data is lost.
|
|
|
+* The disks hosting temporary directories defined in `fs.s3a.buffer.dir` must
|
|
|
+have the capacity to store the entire buffered file.
|
|
|
+
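+As a purely illustrative example: with 1 GB of data buffered and a sustained
+upload bandwidth of 10 MB/s to the S3 endpoint, the `close()` call will block
+for roughly 100 seconds.
+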
|
|
|
+Put succinctly: the further the process is from the S3 endpoint, or the smaller
+the EC2-hosted VM is, the longer it will take for the work to complete.
|
|
|
+
|
|
|
+This can create problems in application code:
|
|
|
+
|
|
|
+* Code often assumes that the `close()` call is fast;
|
|
|
+ the delays can create bottlenecks in operations.
|
|
|
+* Very slow uploads sometimes cause applications to time out. (Generally,
+threads blocking during the upload stop reporting progress, and so trigger timeouts.)
|
|
|
+* Streaming very large amounts of data may consume all disk space before the upload begins.
|
|
|
+
|
|
|
+
|
|
|
+Work to address this began in Hadoop 2.7 with the `S3AFastOutputStream`
+[HADOOP-11183](https://issues.apache.org/jira/browse/HADOOP-11183), and
+has continued with `S3ABlockOutputStream`
|
|
|
+[HADOOP-13560](https://issues.apache.org/jira/browse/HADOOP-13560).
|
|
|
+
|
|
|
+
|
|
|
+This adds an alternative output stream, "S3A Fast Upload", which:
|
|
|
+
|
|
|
+1. Always uploads large files as blocks with the size set by
|
|
|
+ `fs.s3a.multipart.size`. That is: the threshold at which multipart uploads
|
|
|
+ begin and the size of each upload are identical.
|
|
|
+1. Buffers blocks to disk (default) or in on-heap or off-heap memory.
|
|
|
+1. Uploads blocks in parallel in background threads.
|
|
|
+1. Begins uploading blocks as soon as the buffered data exceeds this partition
|
|
|
+ size.
|
|
|
+1. When buffering data to disk, uses the directory/directories listed in
|
|
|
+ `fs.s3a.buffer.dir`. The size of data which can be buffered is limited
|
|
|
+ to the available disk space.
|
|
|
+1. Generates output statistics as metrics on the filesystem, including
|
|
|
+ statistics of active and pending block uploads.
|
|
|
+1. Has the time to `close()` set by the amount of remaining data to upload, rather
|
|
|
+ than the total size of the file.
|
|
|
+
|
|
|
+With incremental writes of blocks, "S3A fast upload" offers an upload
|
|
|
+time at least as fast as the "classic" mechanism, with significant benefits
|
|
|
+on long-lived output streams, and when very large amounts of data are generated.
|
|
|
+The in-memory buffering mechanisms may also offer a speedup when running adjacent to
+S3 endpoints, as disks are not used for intermediate data storage.
|
|
|
+
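+Below is a minimal, illustrative sketch of an application writing data through
+an S3A output stream with fast upload enabled. The bucket name, path and sizes
+are hypothetical, and in a real deployment these options would normally be set
+in `core-site.xml` rather than in code.
+
+```java
+import java.net.URI;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
+
+public class FastUploadExample {
+  public static void main(String[] args) throws Exception {
+    Configuration conf = new Configuration();
+    // Enable the block output stream and buffer blocks to disk.
+    conf.set("fs.s3a.fast.upload", "true");
+    conf.set("fs.s3a.fast.upload.buffer", "disk");
+
+    FileSystem fs = FileSystem.get(new URI("s3a://example-bucket/"), conf);
+    byte[] block = new byte[8 * 1024 * 1024];   // 8 MB written per call
+
+    // Blocks are queued for upload as soon as fs.s3a.multipart.size bytes
+    // have been buffered; close() then waits only for the remaining data.
+    try (FSDataOutputStream out =
+             fs.create(new Path("s3a://example-bucket/datasets/large.bin"))) {
+      for (int i = 0; i < 64; i++) {
+        out.write(block);
+      }
+    }
+  }
+}
+```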
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload</name>
|
|
|
+ <value>true</value>
|
|
|
+ <description>
|
|
|
+ Use the incremental block upload mechanism with
|
|
|
+ the buffering mechanism set in fs.s3a.fast.upload.buffer.
|
|
|
+ The number of threads performing uploads in the filesystem is defined
|
|
|
+ by fs.s3a.threads.max; the queue of waiting uploads limited by
|
|
|
+ fs.s3a.max.total.tasks.
|
|
|
+ The size of each buffer is set by fs.s3a.multipart.size.
|
|
|
+ </description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload.buffer</name>
|
|
|
+ <value>disk</value>
|
|
|
+ <description>
|
|
|
+ The buffering mechanism to use when using S3A fast upload
|
|
|
+ (fs.s3a.fast.upload=true). Values: disk, array, bytebuffer.
|
|
|
+ This configuration option has no effect if fs.s3a.fast.upload is false.
|
|
|
+
|
|
|
+ "disk" will use the directories listed in fs.s3a.buffer.dir as
|
|
|
+ the location(s) to save data prior to being uploaded.
|
|
|
+
|
|
|
+ "array" uses arrays in the JVM heap
|
|
|
+
|
|
|
+ "bytebuffer" uses off-heap memory within the JVM.
|
|
|
+
|
|
|
+ Both "array" and "bytebuffer" will consume memory in a single stream up to the number
|
|
|
+ of blocks set by:
|
|
|
+
|
|
|
+ fs.s3a.multipart.size * fs.s3a.fast.upload.active.blocks.
|
|
|
+
|
|
|
+ If using either of these mechanisms, keep this value low
|
|
|
+
|
|
|
+  The total number of threads performing work across all streams is set by
|
|
|
+ fs.s3a.threads.max, with fs.s3a.max.total.tasks values setting the number of queued
|
|
|
+ work items.
|
|
|
+ </description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.multipart.size</name>
|
|
|
+ <value>104857600</value>
|
|
|
+ <description>
|
|
|
+ How big (in bytes) to split upload or copy operations up into.
|
|
|
+ </description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload.active.blocks</name>
|
|
|
+ <value>8</value>
|
|
|
+ <description>
|
|
|
+    Maximum number of blocks a single output stream can have
+    active (uploading, or queued to the central FileSystem
+    instance's pool of queued operations).
|
|
|
+
|
|
|
+ This stops a single stream overloading the shared thread pool.
|
|
|
+ </description>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+**Notes**
|
|
|
+
|
|
|
+* If the amount of data written to a stream is below that set in `fs.s3a.multipart.size`,
|
|
|
+the upload is performed in the `OutputStream.close()` operation —as with
|
|
|
+the original output stream.
|
|
|
+
|
|
|
+* The published Hadoop metrics include live queue length and upload
+operation counts, which make it possible to identify when there is a backlog of
+work, or a mismatch between data generation rates and network bandwidth. Per-stream
+statistics can also be logged by calling `toString()` on the current stream
+(see the sketch after these notes).
|
|
|
+
|
|
|
+* Incremental writes are not visible; the object can only be listed
|
|
|
+or read when the multipart operation completes in the `close()` call, which
|
|
|
+will block until the upload is completed.
|
|
|
+
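+The following is an illustrative sketch of logging those per-stream statistics
+from application code; the bucket, path and amount of data written are hypothetical.
+
+```java
+import java.net.URI;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
+
+public class StreamStatisticsExample {
+  public static void main(String[] args) throws Exception {
+    FileSystem fs = FileSystem.get(new URI("s3a://example-bucket/"), new Configuration());
+    try (FSDataOutputStream out = fs.create(new Path("s3a://example-bucket/tmp/stats.bin"))) {
+      out.write(new byte[1024 * 1024]);
+      // The wrapped stream is the S3A output stream; its toString()
+      // reports the block and upload statistics for this stream.
+      System.out.println("Stream statistics: " + out.getWrappedStream());
+    }
+  }
+}
+```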
|
|
|
+
|
|
|
+#### <a name="s3a_fast_upload_disk"></a>Fast Upload with Disk Buffers `fs.s3a.fast.upload.buffer=disk`
|
|
|
+
|
|
|
+When `fs.s3a.fast.upload.buffer` is set to `disk`, all data is buffered
|
|
|
+to local hard disks prior to upload. This minimizes the amount of memory
|
|
|
+consumed, and so eliminates heap size as the limiting factor in queued uploads
|
|
|
+—exactly as the original "direct to disk" buffering used when
|
|
|
+`fs.s3a.fast.upload=false`.
|
|
|
+
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload</name>
|
|
|
+ <value>true</value>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload.buffer</name>
|
|
|
+ <value>disk</value>
|
|
|
+</property>
|
|
|
+
|
|
|
+```
|
|
|
+
|
|
|
+
|
|
|
+#### <a name="s3a_fast_upload_bytebuffer"></a>Fast Upload with ByteBuffers: `fs.s3a.fast.upload.buffer=bytebuffer`
|
|
|
+
|
|
|
+When `fs.s3a.fast.upload.buffer` is set to `bytebuffer`, all data is buffered
|
|
|
+in "Direct" ByteBuffers prior to upload. This *may* be faster than buffering to disk,
|
|
|
+and, on hosts with limited local storage (for example, small EC2 VMs), there may
+not be enough disk space to buffer to.
|
|
|
+
|
|
|
+The ByteBuffers are created in the memory of the JVM, but not in the Java Heap itself.
|
|
|
+The amount of data which can be buffered is
|
|
|
+limited by the Java runtime, the operating system, and, for YARN applications,
|
|
|
+the amount of memory requested for each container.
|
|
|
+
|
|
|
+The slower the write bandwidth to S3, the greater the risk of running out
|
|
|
+of memory —and so the more care is needed in
|
|
|
+[tuning the upload settings](#s3a_fast_upload_thread_tuning).
|
|
|
+
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload</name>
|
|
|
+ <value>true</value>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload.buffer</name>
|
|
|
+ <value>bytebuffer</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+#### <a name="s3a_fast_upload_array"></a>Fast Upload with Arrays: `fs.s3a.fast.upload.buffer=array`
|
|
|
+
|
|
|
+When `fs.s3a.fast.upload.buffer` is set to `array`, all data is buffered
|
|
|
+in byte arrays in the JVM's heap prior to upload.
|
|
|
+This *may* be faster than buffering to disk.
|
|
|
+
|
|
|
+This `array` option is similar to the in-memory-only stream offered in
|
|
|
+Hadoop 2.7 with `fs.s3a.fast.upload=true`.
|
|
|
+
|
|
|
+The amount of data which can be buffered is limited by the available
|
|
|
+size of the JVM heap. The slower the write bandwidth to S3, the greater
|
|
|
+the risk of heap overflows. This risk can be mitigated by
|
|
|
+[tuning the upload settings](#s3a_fast_upload_thread_tuning).
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload</name>
|
|
|
+ <value>true</value>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload.buffer</name>
|
|
|
+ <value>array</value>
|
|
|
+</property>
|
|
|
+
|
|
|
+```
|
|
|
+#### <a name="s3a_fast_upload_thread_tuning"></a>S3A Fast Upload Thread Tuning
|
|
|
+
|
|
|
+Both the [Array](#s3a_fast_upload_array) and [Byte buffer](#s3a_fast_upload_bytebuffer)
|
|
|
+buffer mechanisms can consume very large amounts of memory, on-heap or
|
|
|
+off-heap respectively. The [disk buffer](#s3a_fast_upload_disk) mechanism
|
|
|
+does not use much memory, but will consume hard disk capacity.
|
|
|
+
|
|
|
+If there are many output streams being written to in a single process, the
|
|
|
+amount of memory or disk used is the sum of every stream's active memory/disk use.
|
|
|
+
|
|
|
+Careful tuning may be needed to reduce the risk of running out of memory, especially
|
|
|
+if the data is buffered in memory.
|
|
|
+
|
|
|
+There are a number of parameters which can be tuned:
|
|
|
+
|
|
|
+1. The total number of threads available in the filesystem for data
|
|
|
+uploads *or any other queued filesystem operation*. This is set in
|
|
|
+`fs.s3a.threads.max`
|
|
|
+
|
|
|
+1. The number of operations which can be queued for execution, *awaiting
|
|
|
+a thread*: `fs.s3a.max.total.tasks`
|
|
|
+
|
|
|
+1. The number of blocks which a single output stream can have active,
|
|
|
+that is: being uploaded by a thread, or queued in the filesystem thread queue:
|
|
|
+`fs.s3a.fast.upload.active.blocks`
|
|
|
+
|
|
|
+1. How long an idle thread can stay in the thread pool before it is retired: `fs.s3a.threads.keepalivetime`
|
|
|
+
|
|
|
+
|
|
|
+When the maximum allowed number of active blocks of a single stream is reached,
|
|
|
+no more blocks can be uploaded from that stream until one or more of those active
|
|
|
+blocks' uploads completes. That is: a `write()` call which would trigger an upload
|
|
|
+of a now-full datablock will instead block until there is capacity in the queue.
|
|
|
+
|
|
|
+How does that come together?
|
|
|
+
|
|
|
+* As the pool of threads set in `fs.s3a.threads.max` is shared (and intended
|
|
|
+to be used across all streams), a larger number here can allow for more
|
|
|
+parallel operations. However, as uploads require network bandwidth, adding more
|
|
|
+threads does not guarantee speedup.
|
|
|
+
|
|
|
+* The extra queue of tasks for the thread pool (`fs.s3a.max.total.tasks`)
|
|
|
+covers all ongoing background S3A operations (future plans include: parallelized
|
|
|
+rename operations, asynchronous directory operations).
|
|
|
+
|
|
|
+* When using memory buffering, a small value of `fs.s3a.fast.upload.active.blocks`
|
|
|
+limits the amount of memory which can be consumed per stream.
|
|
|
+
|
|
|
+* When using disk buffering a larger value of `fs.s3a.fast.upload.active.blocks`
|
|
|
+does not consume much memory. But it may result in a large number of blocks
+competing with other filesystem operations.
|
|
|
+
|
|
|
+
|
|
|
+We recommend a low value of `fs.s3a.fast.upload.active.blocks`; enough
|
|
|
+to start background upload without overloading other parts of the system,
|
|
|
+then experiment to see if higher values deliver more throughput —especially
|
|
|
+from VMs running on EC2.
|
|
|
+
|
|
|
+```xml
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.fast.upload.active.blocks</name>
|
|
|
+ <value>4</value>
|
|
|
+ <description>
|
|
|
+    Maximum number of blocks a single output stream can have
+    active (uploading, or queued to the central FileSystem
+    instance's pool of queued operations).
|
|
|
+
|
|
|
+ This stops a single stream overloading the shared thread pool.
|
|
|
+ </description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.threads.max</name>
|
|
|
+ <value>10</value>
|
|
|
+ <description>The total number of threads available in the filesystem for data
|
|
|
+ uploads *or any other queued filesystem operation*.</description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.max.total.tasks</name>
|
|
|
+ <value>5</value>
|
|
|
+ <description>The number of operations which can be queued for execution</description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.threads.keepalivetime</name>
|
|
|
+ <value>60</value>
|
|
|
+ <description>Number of seconds a thread can be idle before being
|
|
|
+ terminated.</description>
|
|
|
+</property>
|
|
|
+
|
|
|
+```
|
|
|
+
|
|
|
+
|
|
|
+#### <a name="s3a_multipart_purge"></a>Cleaning up After Incremental Upload Failures: `fs.s3a.multipart.purge`
|
|
|
+
|
|
|
+
|
|
|
+If an incremental streaming operation is interrupted, there may be
|
|
|
+intermediate partitions uploaded to S3 —data which will be billed for.
|
|
|
+
|
|
|
+These charges can be reduced by enabling `fs.s3a.multipart.purge`,
|
|
|
+and setting a purge time in seconds, such as 86400 seconds —24 hours.
|
|
|
+When an S3A FileSystem instance is instantiated with the purge time greater
|
|
|
+than zero, it will, on startup, delete all outstanding multipart uploads
|
|
|
+older than this time.
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.multipart.purge</name>
|
|
|
+ <value>true</value>
|
|
|
+ <description>True if you want to purge existing multipart uploads that may not have been
|
|
|
+ completed/aborted correctly</description>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.multipart.purge.age</name>
|
|
|
+ <value>86400</value>
|
|
|
+ <description>Minimum age in seconds of multipart uploads to purge</description>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+If an S3A client is instantiated with `fs.s3a.multipart.purge=true`,
|
|
|
+it will delete all out of date uploads *in the entire bucket*. That is: it will affect all
|
|
|
+multipart uploads to that bucket, from all applications.
|
|
|
|
|
|
-Writes are buffered in memory instead of to a file on local disk. This
|
|
|
-removes the throughput bottleneck of the local disk write and read cycle
|
|
|
-before starting the actual upload. Furthermore, it allows handling files that
|
|
|
-are larger than the remaining local disk space.
|
|
|
-
|
|
|
-However, non-trivial memory tuning is needed for optimal results and careless
|
|
|
-settings could cause memory overflow. Up to `fs.s3a.threads.max` parallel
|
|
|
-(part)uploads are active. Furthermore, up to `fs.s3a.max.total.tasks`
|
|
|
-additional part(uploads) can be waiting (and thus memory buffers are created).
|
|
|
-The memory buffer is uploaded as a single upload if it is not larger than
|
|
|
-`fs.s3a.multipart.threshold`. Else, a multi-part upload is initiated and
|
|
|
-parts of size `fs.s3a.multipart.size` are used to protect against overflowing
|
|
|
-the available memory. These settings should be tuned to the envisioned
|
|
|
-workflow (some large files, many small ones, ...) and the physical
|
|
|
-limitations of the machine and cluster (memory, network bandwidth).
|
|
|
+Leaving `fs.s3a.multipart.purge` at its default, `false`,
+means that the client will not make any attempt to abort or clean up
+outstanding multipart uploads.
|
|
|
+
|
|
|
+The best practice for using this option is to disable multipart purges in
|
|
|
+normal use of S3A, enabling only in manual/scheduled housekeeping operations.
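+
+As an illustration of such a housekeeping run, the sketch below creates a
+short-lived S3A FileSystem instance with purging enabled, which triggers the
+cleanup described above on startup. The bucket URI and purge age are hypothetical.
+
+```java
+import java.net.URI;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FileSystem;
+
+public class MultipartPurgeHousekeeping {
+  public static void main(String[] args) throws Exception {
+    Configuration conf = new Configuration();
+    // Purge any multipart upload in the bucket older than 24 hours.
+    conf.set("fs.s3a.multipart.purge", "true");
+    conf.set("fs.s3a.multipart.purge.age", "86400");
+
+    // newInstance() bypasses the FileSystem cache, so these settings are
+    // guaranteed to apply; the purge is performed when the instance starts up.
+    FileSystem fs = FileSystem.newInstance(new URI("s3a://example-bucket/"), conf);
+    fs.close();
+  }
+}
+```
+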
|
|
|
|
|
|
### S3A Experimental "fadvise" input policy support
|
|
|
|
|
@@ -1221,7 +1543,143 @@ can be used:
|
|
|
Using the explicit endpoint for the region is recommended for speed and the
|
|
|
ability to use the V4 signing API.
|
|
|
|
|
|
-## Visible S3 Inconsistency
|
|
|
+
|
|
|
+### "Timeout waiting for connection from pool" when writing to S3A
|
|
|
+
|
|
|
+This happens when using the block output stream (`fs.s3a.fast.upload=true`) and
|
|
|
+the thread pool runs out of capacity.
|
|
|
+
|
|
|
+```
|
|
|
+[s3a-transfer-shared-pool1-t20] INFO http.AmazonHttpClient (AmazonHttpClient.java:executeHelper(496)) - Unable to execute HTTP request: Timeout waiting for connection from pool
+org.apache.http.conn.ConnectionPoolTimeoutException: Timeout waiting for connection from pool
|
|
|
+ at org.apache.http.impl.conn.PoolingClientConnectionManager.leaseConnection(PoolingClientConnectionManager.java:230)
|
|
|
+ at org.apache.http.impl.conn.PoolingClientConnectionManager$1.getConnection(PoolingClientConnectionManager.java:199)
|
|
|
+ at sun.reflect.GeneratedMethodAccessor13.invoke(Unknown Source)
|
|
|
+ at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
|
|
|
+ at java.lang.reflect.Method.invoke(Method.java:498)
|
|
|
+ at com.amazonaws.http.conn.ClientConnectionRequestFactory$Handler.invoke(ClientConnectionRequestFactory.java:70)
|
|
|
+ at com.amazonaws.http.conn.$Proxy10.getConnection(Unknown Source)
|
|
|
+ at org.apache.http.impl.client.DefaultRequestDirector.execute(DefaultRequestDirector.java:424)
|
|
|
+ at org.apache.http.impl.client.AbstractHttpClient.doExecute(AbstractHttpClient.java:884)
|
|
|
+ at org.apache.http.impl.client.CloseableHttpClient.execute(CloseableHttpClient.java:82)
|
|
|
+ at org.apache.http.impl.client.CloseableHttpClient.execute(CloseableHttpClient.java:55)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.executeOneRequest(AmazonHttpClient.java:728)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.executeHelper(AmazonHttpClient.java:489)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.execute(AmazonHttpClient.java:310)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.invoke(AmazonS3Client.java:3785)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.doUploadPart(AmazonS3Client.java:2921)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.uploadPart(AmazonS3Client.java:2906)
|
|
|
+ at org.apache.hadoop.fs.s3a.S3AFileSystem.uploadPart(S3AFileSystem.java:1025)
|
|
|
+ at org.apache.hadoop.fs.s3a.S3ABlockOutputStream$MultiPartUpload$1.call(S3ABlockOutputStream.java:360)
|
|
|
+ at org.apache.hadoop.fs.s3a.S3ABlockOutputStream$MultiPartUpload$1.call(S3ABlockOutputStream.java:355)
|
|
|
+ at org.apache.hadoop.fs.s3a.BlockingThreadPoolExecutorService$CallableWithPermitRelease.call(BlockingThreadPoolExecutorService.java:239)
|
|
|
+ at java.util.concurrent.FutureTask.run(FutureTask.java:266)
|
|
|
+ at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)
|
|
|
+ at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)
|
|
|
+ at java.lang.Thread.run(Thread.java:745)
|
|
|
+```
|
|
|
+
|
|
|
+Make sure that `fs.s3a.connection.maximum` is larger
+than `fs.s3a.threads.max`.
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.threads.max</name>
|
|
|
+ <value>20</value>
|
|
|
+</property>
|
|
|
+
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.connection.maximum</name>
|
|
|
+ <value>30</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+### "Timeout waiting for connection from pool" when reading from S3A
|
|
|
+
|
|
|
+This happens when more threads are trying to read from an S3A system than
|
|
|
+the maximum number of allocated HTTP connections.
|
|
|
+
|
|
|
+Set `fs.s3a.connection.maximum` to a larger value (and at least as large as
|
|
|
+`fs.s3a.threads.max`).
|
|
|
+
|
|
|
+### Out of heap memory when writing to S3A via Fast Upload
|
|
|
+
|
|
|
+This can happen when using the fast upload mechanism (`fs.s3a.fast.upload=true`)
|
|
|
+and in-memory buffering (either `fs.s3a.fast.upload.buffer=array` or
|
|
|
+`fs.s3a.fast.upload.buffer=bytebuffer`).
|
|
|
+
|
|
|
+More data is being generated in the JVM than it can upload to S3 —and
|
|
|
+so much data has been buffered that the JVM has run out of memory.
|
|
|
+
|
|
|
+Consult [S3A Fast Upload Thread Tuning](#s3a_fast_upload_thread_tuning) for
|
|
|
+detail on this issue and options to address it. Consider also buffering to
|
|
|
+disk, rather than memory.
|
|
|
+
|
|
|
+
|
|
|
+### When writing to S3A: "java.io.FileNotFoundException: Completing multi-part upload"
|
|
|
+
|
|
|
+
|
|
|
+```
|
|
|
+java.io.FileNotFoundException: Completing multi-part upload on fork-5/test/multipart/1c397ca6-9dfb-4ac1-9cf7-db666673246b: com.amazonaws.services.s3.model.AmazonS3Exception: The specified upload does not exist. The upload ID may be invalid, or the upload may have been aborted or completed. (Service: Amazon S3; Status Code: 404; Error Code: NoSuchUpload; Request ID: 84FF8057174D9369), S3 Extended Request ID: Ij5Yn6Eq/qIERH4Z6Io3YL2t9/qNZ7z9gjPb1FrTtTovZ8k1MXqh+zCYYjqmfJ/fCY6E1+JR9jA=
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.handleErrorResponse(AmazonHttpClient.java:1182)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.executeOneRequest(AmazonHttpClient.java:770)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.executeHelper(AmazonHttpClient.java:489)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.execute(AmazonHttpClient.java:310)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.invoke(AmazonS3Client.java:3785)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.completeMultipartUpload(AmazonS3Client.java:2705)
|
|
|
+ at org.apache.hadoop.fs.s3a.S3ABlockOutputStream$MultiPartUpload.complete(S3ABlockOutputStream.java:473)
|
|
|
+ at org.apache.hadoop.fs.s3a.S3ABlockOutputStream$MultiPartUpload.access$200(S3ABlockOutputStream.java:382)
|
|
|
+ at org.apache.hadoop.fs.s3a.S3ABlockOutputStream.close(S3ABlockOutputStream.java:272)
|
|
|
+ at org.apache.hadoop.fs.FSDataOutputStream$PositionCache.close(FSDataOutputStream.java:72)
|
|
|
+ at org.apache.hadoop.fs.FSDataOutputStream.close(FSDataOutputStream.java:106)
|
|
|
+```
|
|
|
+
|
|
|
+This surfaces if, while a multipart upload was taking place, all outstanding multipart
|
|
|
+uploads were purged. The upload operation cannot complete because
|
|
|
+the data uploaded has been deleted.
|
|
|
+
|
|
|
+Consult [Cleaning up After Incremental Upload Failures](#s3a_multipart_purge) for
|
|
|
+details on how the multipart purge timeout can be set. If multipart uploads
|
|
|
+are failing with the message above, it may be a sign that this value is too low.
|
|
|
+
|
|
|
+### When writing to S3A, HTTP Exceptions logged at info from `AmazonHttpClient`
|
|
|
+
|
|
|
+```
|
|
|
+[s3a-transfer-shared-pool4-t6] INFO http.AmazonHttpClient (AmazonHttpClient.java:executeHelper(496)) - Unable to execute HTTP request: hwdev-steve-ireland-new.s3.amazonaws.com:443 failed to respond
|
|
|
+org.apache.http.NoHttpResponseException: bucket.s3.amazonaws.com:443 failed to respond
|
|
|
+ at org.apache.http.impl.conn.DefaultHttpResponseParser.parseHead(DefaultHttpResponseParser.java:143)
|
|
|
+ at org.apache.http.impl.conn.DefaultHttpResponseParser.parseHead(DefaultHttpResponseParser.java:57)
|
|
|
+ at org.apache.http.impl.io.AbstractMessageParser.parse(AbstractMessageParser.java:261)
|
|
|
+ at org.apache.http.impl.AbstractHttpClientConnection.receiveResponseHeader(AbstractHttpClientConnection.java:283)
|
|
|
+ at org.apache.http.impl.conn.DefaultClientConnection.receiveResponseHeader(DefaultClientConnection.java:259)
|
|
|
+ at org.apache.http.impl.conn.ManagedClientConnectionImpl.receiveResponseHeader(ManagedClientConnectionImpl.java:209)
|
|
|
+ at org.apache.http.protocol.HttpRequestExecutor.doReceiveResponse(HttpRequestExecutor.java:272)
|
|
|
+ at com.amazonaws.http.protocol.SdkHttpRequestExecutor.doReceiveResponse(SdkHttpRequestExecutor.java:66)
|
|
|
+ at org.apache.http.protocol.HttpRequestExecutor.execute(HttpRequestExecutor.java:124)
|
|
|
+ at org.apache.http.impl.client.DefaultRequestDirector.tryExecute(DefaultRequestDirector.java:686)
|
|
|
+ at org.apache.http.impl.client.DefaultRequestDirector.execute(DefaultRequestDirector.java:488)
|
|
|
+ at org.apache.http.impl.client.AbstractHttpClient.doExecute(AbstractHttpClient.java:884)
|
|
|
+ at org.apache.http.impl.client.CloseableHttpClient.execute(CloseableHttpClient.java:82)
|
|
|
+ at org.apache.http.impl.client.CloseableHttpClient.execute(CloseableHttpClient.java:55)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.executeOneRequest(AmazonHttpClient.java:728)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.executeHelper(AmazonHttpClient.java:489)
|
|
|
+ at com.amazonaws.http.AmazonHttpClient.execute(AmazonHttpClient.java:310)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.invoke(AmazonS3Client.java:3785)
|
|
|
+ at com.amazonaws.services.s3.AmazonS3Client.copyPart(AmazonS3Client.java:1731)
|
|
|
+ at com.amazonaws.services.s3.transfer.internal.CopyPartCallable.call(CopyPartCallable.java:41)
|
|
|
+ at com.amazonaws.services.s3.transfer.internal.CopyPartCallable.call(CopyPartCallable.java:28)
|
|
|
+ at org.apache.hadoop.fs.s3a.BlockingThreadPoolExecutorService$CallableWithPermitRelease.call(BlockingThreadPoolExecutorService.java:239)
|
|
|
+ at java.util.concurrent.FutureTask.run(FutureTask.java:266)
|
|
|
+ at java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)
|
|
|
+ at java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)
|
|
|
+ at java.lang.Thread.run(Thread.java:745)
|
|
|
+```
|
|
|
+
|
|
|
+These are HTTP I/O exceptions caught and logged inside the AWS SDK. The client
|
|
|
+will attempt to retry the operation; it may just be a transient event. If there
|
|
|
+are many such exceptions in logs, it may be a symptom of connectivity or network
|
|
|
+problems.
|
|
|
+
|
|
|
+### Visible S3 Inconsistency
|
|
|
|
|
|
Amazon S3 is *an eventually consistent object store*. That is: not a filesystem.
|
|
|
|
|
@@ -1564,7 +2022,7 @@ tests or the `it.test` property for integration tests.
|
|
|
|
|
|
mvn clean test -Dtest=TestS3AInputPolicies
|
|
|
|
|
|
- mvn clean verify -Dit.test=ITestS3AFileContextStatistics
|
|
|
+ mvn clean verify -Dit.test=ITestS3AFileContextStatistics -Dtest=none
|
|
|
|
|
|
mvn clean verify -Dtest=TestS3A* -Dit.test=ITestS3A*
|
|
|
|
|
@@ -1614,7 +2072,7 @@ An alternate endpoint may be defined in `test.fs.s3a.sts.endpoint`.
|
|
|
|
|
|
The default is ""; meaning "use the amazon default value".
|
|
|
|
|
|
-#### CSV Data source Tests
|
|
|
+### CSV Data source Tests
|
|
|
|
|
|
The `TestS3AInputStreamPerformance` tests require read access to a multi-MB
|
|
|
text file. The default file for these tests is one published by amazon,
|
|
@@ -1661,18 +2119,89 @@ endpoint:
|
|
|
<value>s3.amazonaws.com</value>
|
|
|
</property>
|
|
|
```
|
|
|
+### Viewing Integration Test Reports
|
|
|
|
|
|
-#### Scale test operation count
|
|
|
+
|
|
|
+Integration test results and logs are stored in `target/failsafe-reports/`.
|
|
|
+An HTML report can be generated during site generation, or with the `surefire-report`
|
|
|
+plugin:
|
|
|
+
|
|
|
+```bash
|
|
|
+mvn surefire-report:failsafe-report-only
|
|
|
+```
|
|
|
+
+### Scale Tests
|
|
|
+
|
|
|
+There is a set of tests, the *Scale Tests*, designed to measure the scalability
+and performance of S3A at scale. The tests include: creating
|
|
|
+and traversing directory trees, uploading large files, renaming them,
|
|
|
+deleting them, seeking through the files, performing random IO, and others.
|
|
|
+This makes them a foundational part of the benchmarking.
|
|
|
+
|
|
|
+By their very nature they are slow. And, as their execution time is often
|
|
|
+limited by bandwidth between the computer running the tests and the S3 endpoint,
|
|
|
+parallel execution does not speed these tests up.
|
|
|
+
|
|
|
+#### Enabling the Scale Tests
|
|
|
+
|
|
|
+The tests are enabled if the `scale` property is set in the maven build;
+this can be done regardless of whether or not the parallel test profile
+is used:
|
|
|
+
|
|
|
+```bash
|
|
|
+mvn verify -Dscale
|
|
|
+
|
|
|
+mvn verify -Dparallel-tests -Dscale -DtestsThreadCount=8
|
|
|
+```
|
|
|
+
|
|
|
+The most bandwidth-intensive tests (those which upload data) always run
+sequentially; those which are slow due to HTTPS setup costs or server-side
+actions are included in the set of parallelized tests.
|
|
|
+
|
|
|
+
|
|
|
+#### Maven build tuning options
|
|
|
+
|
|
|
+
|
|
|
+Some of the tests can be tuned from the maven build or from the
|
|
|
+configuration file used to run the tests.
|
|
|
+
|
|
|
+```bash
|
|
|
+mvn verify -Dscale -Dfs.s3a.scale.test.huge.filesize=128M
|
|
|
+```
|
|
|
+
|
|
|
+The algorithm is as follows (a code sketch of this resolution order follows the list):
|
|
|
+
|
|
|
+1. The value is queried from the configuration file, using a default value if
|
|
|
+it is not set.
|
|
|
+1. The value is queried from the JVM System Properties, where it is passed
|
|
|
+down by maven.
|
|
|
+1. If the system property is null, empty, or it has the value `unset`, then
|
|
|
+the configuration value is used. The `unset` option is used to
|
|
|
+[work round a quirk in maven property propagation](http://stackoverflow.com/questions/7773134/null-versus-empty-arguments-in-maven).
|
|
|
+
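+The resolution order can be pictured with the hedged sketch below; the helper
+name `getTestProperty` and its signature are illustrative, not the actual test
+support code.
+
+```java
+import org.apache.hadoop.conf.Configuration;
+
+public final class TestPropertyResolution {
+
+  /**
+   * Resolve a test property: take the configuration value (or the default),
+   * then let a maven-supplied JVM system property override it, treating
+   * null, the empty string and "unset" as "no value supplied".
+   */
+  static String getTestProperty(Configuration conf, String key, String defVal) {
+    String confVal = conf.get(key, defVal);
+    String sysProp = System.getProperty(key);
+    boolean unset = sysProp == null || sysProp.isEmpty() || "unset".equals(sysProp);
+    return unset ? confVal : sysProp;
+  }
+}
+```
+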
|
|
|
+Only a few properties can be set this way; more will be added.
|
|
|
+
|
|
|
+| Property | Meaning |
|
|
|
+|-----------|-------------|
|
|
|
+| `fs.s3a.scale.test.timeout`| Timeout in seconds for scale tests |
|
|
|
+| `fs.s3a.scale.test.huge.filesize`| Size for huge file uploads |
|
|
|
+| `fs.s3a.scale.test.huge.partitionsize`| Size for partitions in huge file uploads |
|
|
|
+
|
|
|
+The file and partition sizes are numeric values with a k/m/g/t/p suffix depending
|
|
|
+on the desired size. For example: 128M, 128m, 2G, 4T or even 1P.
|
|
|
+
|
|
|
+#### Scale test configuration options
|
|
|
|
|
|
Some scale tests perform multiple operations (such as creating many directories).
|
|
|
|
|
|
The exact number of operations to perform is configurable in the option
|
|
|
`scale.test.operation.count`
|
|
|
|
|
|
- <property>
|
|
|
- <name>scale.test.operation.count</name>
|
|
|
- <value>10</value>
|
|
|
- </property>
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>scale.test.operation.count</name>
|
|
|
+ <value>10</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
|
|
|
Larger values generate more load, and are recommended when testing locally,
|
|
|
or in batch runs.
|
|
@@ -1685,19 +2214,64 @@ the width and depth of tests creating recursive directories. Larger
|
|
|
values create exponentially more directories, with consequent performance
|
|
|
impact.
|
|
|
|
|
|
- <property>
|
|
|
- <name>scale.test.directory.count</name>
|
|
|
- <value>2</value>
|
|
|
- </property>
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>scale.test.directory.count</name>
|
|
|
+ <value>2</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
|
|
|
DistCp tests targeting S3A support a configurable file size. The default is
|
|
|
10 MB, but the configuration value is expressed in KB so that it can be tuned
|
|
|
smaller to achieve faster test runs.
|
|
|
|
|
|
- <property>
|
|
|
- <name>scale.test.distcp.file.size.kb</name>
|
|
|
- <value>10240</value>
|
|
|
- </property>
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>scale.test.distcp.file.size.kb</name>
|
|
|
+ <value>10240</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+S3A-specific scale test properties are:
|
|
|
+
|
|
|
+##### `fs.s3a.scale.test.huge.filesize`: size of the files used in the "Huge file tests".
|
|
|
+
|
|
|
+The Huge File tests validate S3A's ability to handle large files —the property
|
|
|
+`fs.s3a.scale.test.huge.filesize` declares the file size to use.
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.scale.test.huge.filesize</name>
|
|
|
+ <value>200M</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+Amazon S3 handles files larger than 5GB differently than smaller ones.
|
|
|
+Setting the huge filesize to a number greater than that validates support
|
|
|
+for huge files.
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.scale.test.huge.filesize</name>
|
|
|
+ <value>6G</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+Tests at this scale are slow: they are best executed from hosts running in
|
|
|
+the cloud infrastructure where the S3 endpoint is based.
|
|
|
+Otherwise, set a large timeout in `fs.s3a.scale.test.timeout`:
|
|
|
+
|
|
|
+```xml
|
|
|
+<property>
|
|
|
+ <name>fs.s3a.scale.test.timeout</name>
|
|
|
+ <value>432000</value>
|
|
|
+</property>
|
|
|
+```
|
|
|
+
|
|
|
+
|
|
|
+The tests are ordered so that created files are only cleaned up after
+all of the tests have run. If the tests are interrupted, the test data will remain.
|
|
|
+
|
|
|
|
|
|
|
|
|
### Testing against non AWS S3 endpoints.
|