This repository was archived by the owner on Jun 18, 2020. It is now read-only.

Commit ba3c751

Alexander Patrikalakis authored and committed
Update SDK. Allow creating destination if it does not exist.
1 parent d7100fd commit ba3c751

File tree: 12 files changed, +448 −236 lines


.gitignore (+5)

```diff
@@ -0,0 +1,5 @@
+/.idea
+/target
+/*.iml
+.*~
+*~
```

README.md (+141 −82)

````diff
@@ -1,79 +1,127 @@
 # DynamoDB Import Export Tool
-The DynamoDB Import Export Tool is designed to perform parallel scans on the source table, store scan results in a queue, then consume the queue by writing the items asynchronously to a destination table.
+The DynamoDB Import Export Tool is designed to perform parallel scans on the source table,
+store scan results in a queue, then consume the queue by writing the items asynchronously to a destination table.
 
 ## Requirements ##
 * Maven
 * JRE 1.7+
-* Pre-existing source and destination DynamoDB tables
+* Pre-existing source DynamoDB tables. The destination table is optional in the CLI; you can choose to create the
+destination table if it does not exist.
 
 ## Running as an executable
-
-1. Build the library:
-
-```
-mvn install
+1. Build the library with `mvn install`. This produces the target jar in the target/ directory.
+The CLI's usage follows with required parameters marked by asterisks.
+
+```bash
+--consistentScan
+    Use this flag to use strongly consistent scan. If the flag is not used
+    it will default to eventually consistent scan
+    Default: false
+--createDestination
+    Create destination table if it does not exist
+    Default: false
+--copyStreamSpecificationWhenCreating
+    Use the source table stream specification for the destination table
+    during its creation.
+    Default: false
+--destinationEndpoint
+    Endpoint of the destination table
+* --destinationRegion
+    Signing region for the destination endpoint
+* --destinationTable
+    Name of the destination table
+--help
+    Display usage information
+--maxWriteThreads
+    Number of max threads to write to destination table
+    Default: 1024
+* --readThroughputRatio
+    Percentage of total read throughput to scan the source table
+    Default: 0.0
+--section
+    Section number to scan when running multiple programs concurrently [0,
+    1... totalSections-1]
+    Default: 0
+--sourceEndpoint
+    Endpoint of the source table
+* --sourceRegion
+    Signing region for the source endpoint
+* --sourceTable
+    Name of the source table
+--totalSections
+    Total number of sections to divide the scan into
+    Default: 1
+* --writeThroughputRatio
+    Percentage of total write throughput to write the destination table
+    Default: 0.0
 ```
 
-2. This produces the target jar in the target/ directory, to start the replication process:
-
-java -jar dynamodb-import-export-tool.jar
-
---destinationEndpoint <destination_endpoint> // the DynamoDB endpoint where the destination table is located.
-
---destinationTable <destination_table> // the destination table to write to.
-
---sourceEndpoint <source_endpoint> // the endpoint where the source table is located.
-
---sourceTable <source_table> // the source table to read from.
-
---readThroughputRatio <ratio_in_decimal> // the ratio of read throughput to consume from the source table.
-
---writeThroughputRatio <ratio_in_decimal> // the ratio of write throughput to consume from the destination table.
-
---maxWriteThreads <numWriteThreads> // (Optional, default=128 * Available_Processors) Maximum number of write threads to create.
-
---totalSections <numSections> // (Optional, default=1) Total number of sections to split the bootstrap into. Each application will only scan and write one section.
-
---section <sectionSequence> // (Optional, default=0) section to read and write. Only will scan this one section of all sections, [0...totalSections-1].
-
---consistentScan <boolean> // (Optional, default=false) indicates whether consistent scan should be used when reading from the source table.
+2. An example command you can use on one EC2 host to copy from one table `foo` in `us-east-1` to a new table
+called `bar` in `us-east-2` follows.
+
+```bash
+java -jar target/dynamodb-import-export-tool-1.1.0.jar \
+    --sourceRegion us-east-1 \
+    --sourceTable foo \
+    --destinationRegion us-east-2 \
+    --destinationTable bar \
+    --readThroughputRatio 1 \
+    --writeThroughputRatio 1
+```
 
-> **NOTE**: To split the replication process across multiple machines, simply use the totalSections & section command line arguments, where each machine will run one section out of [0 ... totalSections-1].
+> **NOTE**: To split the replication process across multiple machines, simply use the totalSections & section
+command line arguments, where each machine will run one section out of [0 ... totalSections-1].
 
 ## Using the API
+Find some examples of how to use the Import-Export tool's API below.
+The first demonstrates how to use the API to copy data from one DynamoDB table to another.
+The second demonstrates how to enqueue the data in a DynamoDB table in a
+`BlockingQueueConsumer` in memory.
 
 ### 1. Transfer Data from One DynamoDB Table to Another DynamoDB Table
 
-The below example will read from "mySourceTable" at 100 reads per second, using 4 threads. And it will write to "myDestinationTable" at 50 writes per second, using 8 threads.
-Both tables are located at "dynamodb.us-west-1.amazonaws.com". (to transfer to a different region, create 2 AmazonDynamoDBClients
+The below example will read from "mySourceTable" at 100 reads per second, using four threads.
+And it will write to "myDestinationTable" at 50 writes per second, using eight threads.
+Both tables are located at "dynamodb.us-west-1.amazonaws.com".
+To transfer to a different region, create two AmazonDynamoDBClients
 with different endpoints to pass into the DynamoDBBootstrapWorker and the DynamoDBConsumer.
 
 ```java
-AmazonDynamoDBClient client = new AmazonDynamoDBClient(new ProfileCredentialsProvider());
-client.setEndpoint("dynamodb.us-west-1.amazonaws.com");
-
-DynamoDBBootstrapWorker worker = null;
-
-try {
-    // 100.0 read operations per second. 4 threads to scan the table.
-    worker = new DynamoDBBootstrapWorker(client,
-            100.0, "mySourceTable", 4);
-} catch (NullReadCapacityException e) {
-    LOGGER.error("The DynamoDB source table returned a null read capacity.", e);
-    System.exit(1);
-}
-
-// 50.0 write operations per second. 8 threads to scan the table.
-DynamoDBConsumer consumer = new DynamoDBConsumer(client, "myDestinationTable", 50.0, Executors.newFixedThreadPool(8));
-
-try {
-    worker.pipe(consumer);
-} catch (ExecutionException e) {
-    LOGGER.error("Encountered exception when executing transfer.", e);
-    System.exit(1);
-} catch (InterruptedException e){
-    LOGGER.error("Interrupted when executing transfer.", e);
-    System.exit(1);
+import com.amazonaws.dynamodb.bootstrap.DynamoDBBootstrapWorker;
+import com.amazonaws.dynamodb.bootstrap.DynamoDBConsumer;
+import com.amazonaws.dynamodb.bootstrap.exception.NullReadCapacityException;
+import com.amazonaws.services.dynamodbv2.AmazonDynamoDB;
+import com.amazonaws.services.dynamodbv2.AmazonDynamoDBClientBuilder;
+
+import java.util.concurrent.ExecutionException;
+import java.util.concurrent.Executors;
+
+class TransferDataFromOneTableToAnother {
+    public static void main(String[] args) {
+        AmazonDynamoDB client = AmazonDynamoDBClientBuilder.standard()
+                .withRegion(com.amazonaws.regions.Regions.US_WEST_1).build();
+        DynamoDBBootstrapWorker worker = null;
+        try {
+            // 100.0 read operations per second. 4 threads to scan the table.
+            worker = new DynamoDBBootstrapWorker(client,
+                    100.0, "mySourceTable", 4);
+        } catch (NullReadCapacityException e) {
+            System.err.println("The DynamoDB source table returned a null read capacity.");
+            System.exit(1);
+        }
+        // 50.0 write operations per second. 8 threads to scan the table.
+        DynamoDBConsumer consumer = new DynamoDBConsumer(client, "myDestinationTable", 50.0,
+                Executors.newFixedThreadPool(8));
+        try {
+            worker.pipe(consumer);
+        } catch (ExecutionException e) {
+            System.err.println("Encountered exception when executing transfer: " + e.getMessage());
+            System.exit(1);
+        } catch (InterruptedException e) {
+            System.err.println("Interrupted when executing transfer: " + e.getMessage());
+            System.exit(1);
+        }
+    }
 }
 ```
 
@@ -85,29 +133,40 @@ the DynamoDB entries but does not have a setup application for it. They can just
 to then process the new entries.
 
 ```java
-AmazonDynamoDBClient client = new AmazonDynamoDBClient(new ProfileCredentialsProvider());
-client.setEndpoint("dynamodb.us-west-1.amazonaws.com");
-
-DynamoDBBootstrapWorker worker = null;
-
-try {
-    // 100.0 read operations per second. 4 threads to scan the table.
-    worker = new DynamoDBBootstrapWorker(client,
-            100.0, "mySourceTable", 4);
-} catch (NullReadCapacityException e) {
-    LOGGER.error("The DynamoDB source table returned a null read capacity.", e);
-    System.exit(1);
-}
-
-BlockingQueueConsumer consumer = new BlockingQueueConsumer(8);
-
-try {
-    worker.pipe(consumer);
-} catch (ExecutionException e) {
-    LOGGER.error("Encountered exception when executing transfer.", e);
-    System.exit(1);
-} catch (InterruptedException e){
-    LOGGER.error("Interrupted when executing transfer.", e);
-    System.exit(1);
+import com.amazonaws.dynamodb.bootstrap.BlockingQueueConsumer;
+import com.amazonaws.dynamodb.bootstrap.DynamoDBBootstrapWorker;
+import com.amazonaws.dynamodb.bootstrap.exception.NullReadCapacityException;
+import com.amazonaws.services.dynamodbv2.AmazonDynamoDB;
+import com.amazonaws.services.dynamodbv2.AmazonDynamoDBClientBuilder;
+
+import java.util.concurrent.ExecutionException;
+
+class TransferDataFromOneTableToBlockingQueue {
+    public static void main(String[] args) {
+        AmazonDynamoDB client = AmazonDynamoDBClientBuilder.standard()
+                .withRegion(com.amazonaws.regions.Regions.US_WEST_1).build();
+
+        DynamoDBBootstrapWorker worker = null;
+
+        try {
+            // 100.0 read operations per second. 4 threads to scan the table.
+            worker = new DynamoDBBootstrapWorker(client, 100.0, "mySourceTable", 4);
+        } catch (NullReadCapacityException e) {
+            System.err.println("The DynamoDB source table returned a null read capacity.");
+            System.exit(1);
+        }
+
+        BlockingQueueConsumer consumer = new BlockingQueueConsumer(8);
+
+        try {
+            worker.pipe(consumer);
+        } catch (ExecutionException e) {
+            System.err.println("Encountered exception when executing transfer: " + e.getMessage());
+            System.exit(1);
+        } catch (InterruptedException e) {
+            System.err.println("Interrupted when executing transfer: " + e.getMessage());
+            System.exit(1);
+        }
+    }
 }
 ```
````
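The multi-machine split the README describes (`--totalSections`/`--section`), combined with the `--createDestination` flag this commit adds, can be sketched as below. This is only an illustration, not part of the commit: the table names (`foo`, `bar`), regions, and throughput ratios are assumed values, and the script echoes one per-host command per section rather than running the tool.

```shell
#!/bin/bash
# Generate one CLI invocation per worker host; each host runs exactly one
# section out of [0 ... TOTAL_SECTIONS-1]. Splitting the throughput ratio
# evenly across sections (0.25 each for 4 sections) is an assumption.
TOTAL_SECTIONS=4
CMDS=()
for SECTION in $(seq 0 $((TOTAL_SECTIONS - 1))); do
  CMD="java -jar target/dynamodb-import-export-tool-1.1.0.jar"
  CMD="$CMD --sourceRegion us-east-1 --sourceTable foo"
  CMD="$CMD --destinationRegion us-east-2 --destinationTable bar"
  CMD="$CMD --createDestination"  # create the destination table if missing
  CMD="$CMD --readThroughputRatio 0.25 --writeThroughputRatio 0.25"
  CMD="$CMD --totalSections $TOTAL_SECTIONS --section $SECTION"
  CMDS+=("$CMD")
done
# Print the command each host would run (copy one line per machine).
printf '%s\n' "${CMDS[@]}"
```

Every generated command shares the same `--totalSections` value and differs only in `--section`, which is what lets the scans cover disjoint key ranges.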

pom.xml (+19 −10)

```diff
@@ -1,7 +1,7 @@
 <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
     <modelVersion>4.0.0</modelVersion>
     <groupId>com.amazonaws</groupId>
-    <version>1.0.1</version>
+    <version>1.1.0</version>
     <artifactId>dynamodb-import-export-tool</artifactId>
     <packaging>jar</packaging>
     <name>DynamoDB Import Export Tool</name>
@@ -11,14 +11,17 @@
         <url>https://github.com/awslabs/dynamodb-import-export-tool.git</url>
     </scm>
     <properties>
-        <aws.java.sdk.version>1.10.10</aws.java.sdk.version>
-        <powermock.version>1.6.2</powermock.version>
-        <jcommander.version>1.48</jcommander.version>
-        <guava.version>15.0</guava.version>
+        <jdk.version>1.7</jdk.version>
+        <aws.java.sdk.version>1.11.123</aws.java.sdk.version>
+        <powermock.version>1.6.6</powermock.version>
+        <jcommander.version>1.69</jcommander.version>
+        <guava.version>21.0</guava.version>
         <log4j.core.version>1.2.17</log4j.core.version>
-        <easymock.version>3.2</easymock.version>
+        <easymock.version>3.4</easymock.version>
         <commons.logging.version>1.2</commons.logging.version>
-        <maven.shade.version>2.4.1</maven.shade.version>
+        <maven.shade.version>3.0.0</maven.shade.version>
+        <maven.compiler.version>3.0</maven.compiler.version>
+        <maven.gpg.version>1.6</maven.gpg.version>
         <gpg.skip>true</gpg.skip>
     </properties>
     <developers>
@@ -84,6 +87,11 @@
             <artifactId>log4j</artifactId>
             <version>${log4j.core.version}</version>
         </dependency>
+        <dependency>
+            <groupId>org.projectlombok</groupId>
+            <artifactId>lombok</artifactId>
+            <version>1.16.14</version>
+        </dependency>
         <dependency>
             <groupId>org.powermock</groupId>
             <artifactId>powermock-module-junit4</artifactId>
@@ -109,14 +117,15 @@
             <plugin>
                 <artifactId>maven-compiler-plugin</artifactId>
                 <configuration>
-                    <source>1.7</source>
-                    <target>1.7</target>
+                    <source>${jdk.version}</source>
+                    <target>${jdk.version}</target>
                 </configuration>
-                <version>3.0</version>
+                <version>${maven.compiler.version}</version>
             </plugin>
             <plugin>
                 <groupId>org.apache.maven.plugins</groupId>
                 <artifactId>maven-gpg-plugin</artifactId>
+                <version>${maven.gpg.version}</version>
                 <executions>
                     <execution>
                         <id>sign-artifacts</id>
```
