diff --git a/runners/google-cloud-dataflow-java/src/main/java/org/apache/beam/runners/dataflow/DataflowRunner.java b/runners/google-cloud-dataflow-java/src/main/java/org/apache/beam/runners/dataflow/DataflowRunner.java
index c41cdf647a69..c65812f01d95 100644
--- a/runners/google-cloud-dataflow-java/src/main/java/org/apache/beam/runners/dataflow/DataflowRunner.java
+++ b/runners/google-cloud-dataflow-java/src/main/java/org/apache/beam/runners/dataflow/DataflowRunner.java
@@ -189,580 +189,615 @@
import org.slf4j.LoggerFactory;
/**
- * A {@link PipelineRunner} that executes the operations in the pipeline by first translating them
- * to the Dataflow representation using the {@link DataflowPipelineTranslator} and then submitting
- * them to a Dataflow service for execution.
+ * A {@link PipelineRunner} that executes the operations in the pipeline by
+ * first translating them to the Dataflow representation using the
+ * {@link DataflowPipelineTranslator} and then submitting them to a Dataflow
+ * service for execution.
 *
 * <h3>Permissions</h3>
 *
- * <p>When reading from a Dataflow source or writing to a Dataflow sink using {@code
- * DataflowRunner}, the Google cloudservices account and the Google compute engine service account
- * of the GCP project running the Dataflow Job will need access to the corresponding source/sink.
+ *
+ * <p>When reading from a Dataflow source or writing to a Dataflow sink using {@code
+ * DataflowRunner}, the Google cloudservices account and the Google Compute
+ * Engine service account of the GCP project running the Dataflow Job will need
+ * access to the corresponding source/sink.
*
- * <p>Please see <a href="https://cloud.google.com/dataflow/security-and-permissions">Google Cloud
- * Dataflow Security and Permissions</a> for more details.
+ *
+ * <p>Please see
+ * <a href="https://cloud.google.com/dataflow/security-and-permissions">Google
+ * Cloud Dataflow Security and Permissions</a> for more details.
+ *
+ * <p>DataflowRunner now supports creating job templates using the
+ * {@code --templateLocation} option. If this option is set, the runner
+ * generates a template instead of running the pipeline immediately.
+ *
+ * <p>Example:
+ *
+ * <pre>{@code
+ * --runner=DataflowRunner
+ * --templateLocation=gs://your-bucket/templates/my-template
+ * }</pre>
*/
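The following is a minimal usage sketch (not part of this change) of the {@code --templateLocation} option described above; the project, region, and bucket paths are placeholders.

import org.apache.beam.runners.dataflow.options.DataflowPipelineOptions;
import org.apache.beam.sdk.Pipeline;
import org.apache.beam.sdk.options.PipelineOptionsFactory;

public class TemplateExample {
  public static void main(String[] args) {
    // With templateLocation set, run() stages a template instead of launching the job.
    DataflowPipelineOptions options =
        PipelineOptionsFactory.fromArgs(
                "--runner=DataflowRunner",
                "--project=my-project",
                "--region=us-central1",
                "--tempLocation=gs://your-bucket/temp",
                "--templateLocation=gs://your-bucket/templates/my-template")
            .as(DataflowPipelineOptions.class);

    Pipeline pipeline = Pipeline.create(options);
    // ... apply transforms ...
    pipeline.run(); // writes the template to gs://your-bucket/templates/my-template
  }
}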
@SuppressWarnings({
- "rawtypes", // TODO(https://github.com/apache/beam/issues/20447)
- "nullness" // TODO(https://github.com/apache/beam/issues/20497)
+ "rawtypes", // TODO(https://github.com/apache/beam/issues/20447)
+ "nullness" // TODO(https://github.com/apache/beam/issues/20497)
})
public class DataflowRunner extends PipelineRunner<DataflowPipelineJob> {
- /** Experiment to "unsafely attempt to process unbounded data in batch mode". */
- public static final String UNSAFELY_ATTEMPT_TO_PROCESS_UNBOUNDED_DATA_IN_BATCH_MODE =
- "unsafely_attempt_to_process_unbounded_data_in_batch_mode";
-
- private static final Logger LOG = LoggerFactory.getLogger(DataflowRunner.class);
- /** Provided configuration options. */
- private final DataflowPipelineOptions options;
-
- /** Client for the Dataflow service. This is used to actually submit jobs. */
- private final DataflowClient dataflowClient;
-
- /** Translator for this DataflowRunner, based on options. */
- private final DataflowPipelineTranslator translator;
-
- /** A set of user defined functions to invoke at different points in execution. */
- private DataflowRunnerHooks hooks;
-
- // The limit of CreateJob request size.
- private static final int CREATE_JOB_REQUEST_LIMIT_BYTES = 10 * 1024 * 1024;
-
- @VisibleForTesting static final int GCS_UPLOAD_BUFFER_SIZE_BYTES_DEFAULT = 1024 * 1024;
-
- @VisibleForTesting static final String PIPELINE_FILE_NAME = "pipeline.pb";
- @VisibleForTesting static final String DATAFLOW_GRAPH_FILE_NAME = "dataflow_graph.json";
-
- private static final ObjectMapper MAPPER = new ObjectMapper();
-
- /**
- * Use an {@link ObjectMapper} configured with any {@link Module}s in the class path allowing for
- * user specified configuration injection into the ObjectMapper. This supports user custom types
- * on {@link PipelineOptions}.
- */
- private static final ObjectMapper MAPPER_WITH_MODULES =
- new ObjectMapper()
- .registerModules(ObjectMapper.findModules(ReflectHelpers.findClassLoader()));
-
- private final Set<PCollection<?>> pcollectionsRequiringIndexedFormat;
-
- private final Set<PCollection<?>> pCollectionsPreservedKeys;
- private final Set<PCollection<?>> pcollectionsRequiringAutoSharding;
-
- /**
- * Project IDs must contain lowercase letters, digits, or dashes. IDs must start with a letter and
- * may not end with a dash. This regex isn't exact - this allows for patterns that would be
- * rejected by the service, but this is sufficient for basic validation of project IDs.
- */
- public static final String PROJECT_ID_REGEXP = "[a-z][-a-z0-9:.]+[a-z0-9]";
-
- /** Dataflow service endpoints are expected to match this pattern. */
- static final String ENDPOINT_REGEXP = "https://[\\S]*googleapis\\.com[/]?";
-
- /**
- * Replaces GCS file paths with local file paths by downloading the GCS files locally. This is
- * useful when files need to be accessed locally before being staged to Dataflow.
- *
- * @param filesToStage List of file paths that may contain GCS paths (gs://) and local paths
- * @return List of local file paths where any GCS paths have been downloaded locally
- * @throws RuntimeException if there are errors copying GCS files locally
- */
- public static List<String> replaceGcsFilesWithLocalFiles(List<String> filesToStage) {
- List<String> processedFiles = new ArrayList<>();
-
- for (String fileToStage : filesToStage) {
- String localPath;
- if (fileToStage.contains("=")) {
- // Handle files with staging name specified
- String[] components = fileToStage.split("=", 2);
- String stagingName = components[0];
- String filePath = components[1];
-
- if (filePath.startsWith("gs://")) {
- try {
- // Create temp file with exact same name as GCS file
- String gcsFileName = filePath.substring(filePath.lastIndexOf('/') + 1);
- File tempDir = Files.createTempDir();
- tempDir.deleteOnExit();
- File tempFile = new File(tempDir, gcsFileName);
- tempFile.deleteOnExit();
+ /**
+ * Experiment to "unsafely attempt to process unbounded data in batch mode".
+ */
+ public static final String UNSAFELY_ATTEMPT_TO_PROCESS_UNBOUNDED_DATA_IN_BATCH_MODE
+ = "unsafely_attempt_to_process_unbounded_data_in_batch_mode";
- LOG.info(
- "Downloading GCS file {} to local temp file {}",
- filePath,
- tempFile.getAbsolutePath());
-
- // Copy GCS file to local temp file
- ResourceId source = FileSystems.matchNewResource(filePath, false);
- try (ReadableByteChannel reader = FileSystems.open(source);
- FileOutputStream writer = new FileOutputStream(tempFile)) {
- ByteStreams.copy(Channels.newInputStream(reader), writer);
+ private static final Logger LOG = LoggerFactory.getLogger(DataflowRunner.class);
+ /**
+ * Provided configuration options.
+ */
+ private final DataflowPipelineOptions options;
+
+ /**
+ * Client for the Dataflow service. This is used to actually submit jobs.
+ */
+ private final DataflowClient dataflowClient;
+
+ /**
+ * Translator for this DataflowRunner, based on options.
+ */
+ private final DataflowPipelineTranslator translator;
+
+ /**
+ * A set of user defined functions to invoke at different points in
+ * execution.
+ */
+ private DataflowRunnerHooks hooks;
+
+ // The limit of CreateJob request size.
+ private static final int CREATE_JOB_REQUEST_LIMIT_BYTES = 10 * 1024 * 1024;
+
+ @VisibleForTesting
+ static final int GCS_UPLOAD_BUFFER_SIZE_BYTES_DEFAULT = 1024 * 1024;
+
+ @VisibleForTesting
+ static final String PIPELINE_FILE_NAME = "pipeline.pb";
+ @VisibleForTesting
+ static final String DATAFLOW_GRAPH_FILE_NAME = "dataflow_graph.json";
+
+ private static final ObjectMapper MAPPER = new ObjectMapper();
+
+ /**
+ * Use an {@link ObjectMapper} configured with any {@link Module}s in the
+ * class path allowing for user specified configuration injection into the
+ * ObjectMapper. This supports user custom types on {@link PipelineOptions}.
+ */
+ private static final ObjectMapper MAPPER_WITH_MODULES
+ = new ObjectMapper()
+ .registerModules(ObjectMapper.findModules(ReflectHelpers.findClassLoader()));
+
+ private final Set<PCollection<?>> pcollectionsRequiringIndexedFormat;
+
+ private final Set<PCollection<?>> pCollectionsPreservedKeys;
+ private final Set<PCollection<?>> pcollectionsRequiringAutoSharding;
+
+ /**
+ * Project IDs must contain lowercase letters, digits, or dashes. IDs must
+ * start with a letter and may not end with a dash. This regex isn't exact -
+ * this allows for patterns that would be rejected by the service, but this
+ * is sufficient for basic validation of project IDs.
+ */
+ public static final String PROJECT_ID_REGEXP = "[a-z][-a-z0-9:.]+[a-z0-9]";
+
+ /**
+ * Dataflow service endpoints are expected to match this pattern.
+ */
+ static final String ENDPOINT_REGEXP = "https://[\\S]*googleapis\\.com[/]?";
+
+ /**
+ * Replaces GCS file paths with local file paths by downloading the GCS
+ * files locally. This is useful when files need to be accessed locally
+ * before being staged to Dataflow.
+ *
+ * @param filesToStage List of file paths that may contain GCS paths (gs://)
+ * and local paths
+ * @return List of local file paths where any GCS paths have been downloaded
+ * locally
+ * @throws RuntimeException if there are errors copying GCS files locally
+ */
+ public static List<String> replaceGcsFilesWithLocalFiles(List<String> filesToStage) {
+ List<String> processedFiles = new ArrayList<>();
+
+ for (String fileToStage : filesToStage) {
+ String localPath;
+ if (fileToStage.contains("=")) {
+ // Handle files with staging name specified
+ String[] components = fileToStage.split("=", 2);
+ String stagingName = components[0];
+ String filePath = components[1];
+
+ if (filePath.startsWith("gs://")) {
+ try {
+ // Create temp file with exact same name as GCS file
+ String gcsFileName = filePath.substring(filePath.lastIndexOf('/') + 1);
+ File tempDir = Files.createTempDir();
+ tempDir.deleteOnExit();
+ File tempFile = new File(tempDir, gcsFileName);
+ tempFile.deleteOnExit();
+
+ LOG.info(
+ "Downloading GCS file {} to local temp file {}",
+ filePath,
+ tempFile.getAbsolutePath());
+
+ // Copy GCS file to local temp file
+ ResourceId source = FileSystems.matchNewResource(filePath, false);
+ try (ReadableByteChannel reader = FileSystems.open(source); FileOutputStream writer = new FileOutputStream(tempFile)) {
+ ByteStreams.copy(Channels.newInputStream(reader), writer);
+ }
+
+ localPath = stagingName + "=" + tempFile.getAbsolutePath();
+ LOG.info("Replaced GCS path {} with local path {}", fileToStage, localPath);
+ } catch (IOException e) {
+ throw new RuntimeException("Failed to copy GCS file locally: " + filePath, e);
+ }
+ } else {
+ localPath = fileToStage;
+ }
+ } else {
+ // Handle files without staging name
+ if (fileToStage.startsWith("gs://")) {
+ try {
+ // Create temp file with exact same name as GCS file
+ String gcsFileName = fileToStage.substring(fileToStage.lastIndexOf('/') + 1);
+ File tempDir = Files.createTempDir();
+ tempDir.deleteOnExit();
+ File tempFile = new File(tempDir, gcsFileName);
+ tempFile.deleteOnExit();
+
+ LOG.info(
+ "Downloading GCS file {} to local temp file {}",
+ fileToStage,
+ tempFile.getAbsolutePath());
+
+ // Copy GCS file to local temp file
+ ResourceId source = FileSystems.matchNewResource(fileToStage, false);
+ try (ReadableByteChannel reader = FileSystems.open(source); FileOutputStream writer = new FileOutputStream(tempFile)) {
+ ByteStreams.copy(Channels.newInputStream(reader), writer);
+ }
+
+ localPath = tempFile.getAbsolutePath();
+ LOG.info("Replaced GCS path {} with local path {}", fileToStage, localPath);
+ } catch (IOException e) {
+ throw new RuntimeException("Failed to copy GCS file locally: " + fileToStage, e);
+ }
+ } else {
+ localPath = fileToStage;
+ }
}
+ processedFiles.add(localPath);
+ }
+
+ return processedFiles;
+ }
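A quick illustration of the helper above (a sketch; the bucket, jar names, and staging name are hypothetical):

// Entries may be plain paths or "stagingName=path" pairs; only gs:// paths are rewritten.
List<String> staged =
    DataflowRunner.replaceGcsFilesWithLocalFiles(
        java.util.Arrays.asList(
            "extra.jar=gs://my-bucket/deps/extra.jar", // becomes "extra.jar=/<tmp-dir>/extra.jar"
            "/opt/libs/local.jar"));                   // local paths pass through unchanged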
+
+ /**
+ * Construct a runner from the provided options.
+ *
+ * @param options Properties that configure the runner.
+ * @return The newly created runner.
+ */
+ public static DataflowRunner fromOptions(PipelineOptions options) {
+ DataflowPipelineOptions dataflowOptions
+ = PipelineOptionsValidator.validate(DataflowPipelineOptions.class, options);
+ ArrayList<String> missing = new ArrayList<>();
+
+ if (dataflowOptions.getAppName() == null) {
+ missing.add("appName");
+ }
+
+ if (Strings.isNullOrEmpty(dataflowOptions.getRegion())
+ && isServiceEndpoint(dataflowOptions.getDataflowEndpoint())) {
+ missing.add("region");
+ }
+ if (missing.size() > 0) {
+ throw new IllegalArgumentException(
+ "Missing required pipeline options: " + Joiner.on(',').join(missing));
+ }
+
+ validateWorkerSettings(
+ PipelineOptionsValidator.validate(DataflowPipelineWorkerPoolOptions.class, options));
+
+ PathValidator validator = dataflowOptions.getPathValidator();
+ String gcpTempLocation;
+ try {
+ gcpTempLocation = dataflowOptions.getGcpTempLocation();
+ } catch (Exception e) {
+ throw new IllegalArgumentException(
+ "DataflowRunner requires gcpTempLocation, "
+ + "but failed to retrieve a value from PipelineOptions",
+ e);
+ }
+ validator.validateOutputFilePrefixSupported(gcpTempLocation);
- localPath = stagingName + "=" + tempFile.getAbsolutePath();
- LOG.info("Replaced GCS path {} with local path {}", fileToStage, localPath);
- } catch (IOException e) {
- throw new RuntimeException("Failed to copy GCS file locally: " + filePath, e);
- }
+ String stagingLocation;
+ try {
+ stagingLocation = dataflowOptions.getStagingLocation();
+ } catch (Exception e) {
+ throw new IllegalArgumentException(
+ "DataflowRunner requires stagingLocation, "
+ + "but failed to retrieve a value from PipelineOptions",
+ e);
+ }
+ validator.validateOutputFilePrefixSupported(stagingLocation);
+
+ if (!isNullOrEmpty(dataflowOptions.getSaveProfilesToGcs())) {
+ validator.validateOutputFilePrefixSupported(dataflowOptions.getSaveProfilesToGcs());
+ }
+
+ if (dataflowOptions.getFilesToStage() != null) {
+ // Replace GCS file paths with local file paths
+ dataflowOptions.setFilesToStage(
+ replaceGcsFilesWithLocalFiles(dataflowOptions.getFilesToStage()));
+ // The user specifically requested these files, so fail now if they do not exist.
+ // (automatically detected classpath elements are permitted to not exist, so later
+ // staging will not fail on nonexistent files)
+ dataflowOptions.getFilesToStage().stream()
+ .forEach(
+ stagedFileSpec -> {
+ File localFile;
+ if (stagedFileSpec.contains("=")) {
+ String[] components = stagedFileSpec.split("=", 2);
+ localFile = new File(components[1]);
+ } else {
+ localFile = new File(stagedFileSpec);
+ }
+ if (!localFile.exists()) {
+ // should be FileNotFoundException, but for build-time backwards compatibility
+ // cannot add checked exception
+ throw new RuntimeException(
+ String.format("Non-existent files specified in filesToStage: %s", localFile));
+ }
+ });
} else {
- localPath = fileToStage;
- }
- } else {
- // Handle files without staging name
- if (fileToStage.startsWith("gs://")) {
- try {
- // Create temp file with exact same name as GCS file
- String gcsFileName = fileToStage.substring(fileToStage.lastIndexOf('/') + 1);
- File tempDir = Files.createTempDir();
- tempDir.deleteOnExit();
- File tempFile = new File(tempDir, gcsFileName);
- tempFile.deleteOnExit();
+ dataflowOptions.setFilesToStage(
+ detectClassPathResourcesToStage(DataflowRunner.class.getClassLoader(), options));
+ if (dataflowOptions.getFilesToStage().isEmpty()) {
+ throw new IllegalArgumentException("No files to stage has been found.");
+ } else {
+ LOG.info(
+ "PipelineOptions.filesToStage was not specified. "
+ + "Defaulting to files from the classpath: will stage {} files. "
+ + "Enable logging at DEBUG level to see which files will be staged.",
+ dataflowOptions.getFilesToStage().size());
+ LOG.debug("Classpath elements: {}", dataflowOptions.getFilesToStage());
+ }
+ }
+ // Verify jobName according to service requirements, truncating and converting to lowercase
+ // if necessary.
+ String jobName = dataflowOptions.getJobName().toLowerCase();
+ checkArgument(
+ jobName.matches("[a-z]([-a-z0-9]*[a-z0-9])?"),
+ "JobName invalid; the name must consist of only the characters "
+ + "[-a-z0-9], starting with a letter and ending with a letter "
+ + "or number");
+ if (!jobName.equals(dataflowOptions.getJobName())) {
LOG.info(
- "Downloading GCS file {} to local temp file {}",
- fileToStage,
- tempFile.getAbsolutePath());
-
- // Copy GCS file to local temp file
- ResourceId source = FileSystems.matchNewResource(fileToStage, false);
- try (ReadableByteChannel reader = FileSystems.open(source);
- FileOutputStream writer = new FileOutputStream(tempFile)) {
- ByteStreams.copy(Channels.newInputStream(reader), writer);
- }
+ "PipelineOptions.jobName did not match the service requirements. "
+ + "Using {} instead of {}.",
+ jobName,
+ dataflowOptions.getJobName());
+ }
+ dataflowOptions.setJobName(jobName);
+
+ // Verify project
+ String project = dataflowOptions.getProject();
+ if (project.matches("[0-9]*")) {
+ throw new IllegalArgumentException(
+ "Project ID '"
+ + project
+ + "' invalid. Please make sure you specified the Project ID, not project number.");
+ } else if (!project.matches(PROJECT_ID_REGEXP)) {
+ throw new IllegalArgumentException(
+ "Project ID '"
+ + project
+ + "' invalid. Please make sure you specified the Project ID, not project"
+ + " description.");
+ }
- localPath = tempFile.getAbsolutePath();
- LOG.info("Replaced GCS path {} with local path {}", fileToStage, localPath);
- } catch (IOException e) {
- throw new RuntimeException("Failed to copy GCS file locally: " + fileToStage, e);
- }
- } else {
- localPath = fileToStage;
- }
- }
- processedFiles.add(localPath);
- }
-
- return processedFiles;
- }
-
- /**
- * Construct a runner from the provided options.
- *
- * @param options Properties that configure the runner.
- * @return The newly created runner.
- */
- public static DataflowRunner fromOptions(PipelineOptions options) {
- DataflowPipelineOptions dataflowOptions =
- PipelineOptionsValidator.validate(DataflowPipelineOptions.class, options);
- ArrayList<String> missing = new ArrayList<>();
-
- if (dataflowOptions.getAppName() == null) {
- missing.add("appName");
- }
-
- if (Strings.isNullOrEmpty(dataflowOptions.getRegion())
- && isServiceEndpoint(dataflowOptions.getDataflowEndpoint())) {
- missing.add("region");
- }
- if (missing.size() > 0) {
- throw new IllegalArgumentException(
- "Missing required pipeline options: " + Joiner.on(',').join(missing));
- }
-
- validateWorkerSettings(
- PipelineOptionsValidator.validate(DataflowPipelineWorkerPoolOptions.class, options));
-
- PathValidator validator = dataflowOptions.getPathValidator();
- String gcpTempLocation;
- try {
- gcpTempLocation = dataflowOptions.getGcpTempLocation();
- } catch (Exception e) {
- throw new IllegalArgumentException(
- "DataflowRunner requires gcpTempLocation, "
- + "but failed to retrieve a value from PipelineOptions",
- e);
- }
- validator.validateOutputFilePrefixSupported(gcpTempLocation);
-
- String stagingLocation;
- try {
- stagingLocation = dataflowOptions.getStagingLocation();
- } catch (Exception e) {
- throw new IllegalArgumentException(
- "DataflowRunner requires stagingLocation, "
- + "but failed to retrieve a value from PipelineOptions",
- e);
- }
- validator.validateOutputFilePrefixSupported(stagingLocation);
-
- if (!isNullOrEmpty(dataflowOptions.getSaveProfilesToGcs())) {
- validator.validateOutputFilePrefixSupported(dataflowOptions.getSaveProfilesToGcs());
- }
-
- if (dataflowOptions.getFilesToStage() != null) {
- // Replace GCS file paths with local file paths
- dataflowOptions.setFilesToStage(
- replaceGcsFilesWithLocalFiles(dataflowOptions.getFilesToStage()));
- // The user specifically requested these files, so fail now if they do not exist.
- // (automatically detected classpath elements are permitted to not exist, so later
- // staging will not fail on nonexistent files)
- dataflowOptions.getFilesToStage().stream()
- .forEach(
- stagedFileSpec -> {
- File localFile;
- if (stagedFileSpec.contains("=")) {
- String[] components = stagedFileSpec.split("=", 2);
- localFile = new File(components[1]);
- } else {
- localFile = new File(stagedFileSpec);
- }
- if (!localFile.exists()) {
- // should be FileNotFoundException, but for build-time backwards compatibility
- // cannot add checked exception
- throw new RuntimeException(
- String.format("Non-existent files specified in filesToStage: %s", localFile));
+ DataflowPipelineDebugOptions debugOptions
+ = dataflowOptions.as(DataflowPipelineDebugOptions.class);
+ // Verify the number of worker threads is a valid value
+ if (debugOptions.getNumberOfWorkerHarnessThreads() < 0) {
+ throw new IllegalArgumentException(
+ "Number of worker harness threads '"
+ + debugOptions.getNumberOfWorkerHarnessThreads()
+ + "' invalid. Please make sure the value is non-negative.");
+ }
+
+ // Verify that if recordJfrOnGcThrashing is set, the pipeline is at least on java 11
+ if (dataflowOptions.getRecordJfrOnGcThrashing()
+ && Environments.getJavaVersion() == Environments.JavaVersion.java8) {
+ throw new IllegalArgumentException(
+ "recordJfrOnGcThrashing is only supported on java 9 and up.");
+ }
+
+ if (dataflowOptions.isStreaming() && dataflowOptions.getGcsUploadBufferSizeBytes() == null) {
+ dataflowOptions.setGcsUploadBufferSizeBytes(GCS_UPLOAD_BUFFER_SIZE_BYTES_DEFAULT);
+ }
+
+ // Adding the Java version to the SDK name for users' and support convenience.
+ String agentJavaVer = "(JRE 8 environment)";
+ if (Environments.getJavaVersion() != Environments.JavaVersion.java8) {
+ agentJavaVer
+ = String.format("(JRE %s environment)", Environments.getJavaVersion().specification());
+ }
+
+ DataflowRunnerInfo dataflowRunnerInfo = DataflowRunnerInfo.getDataflowRunnerInfo();
+ String userAgentName = dataflowRunnerInfo.getName();
+ Preconditions.checkArgument(
+ !userAgentName.equals(""), "Dataflow runner's `name` property cannot be empty.");
+ String userAgentVersion = dataflowRunnerInfo.getVersion();
+ Preconditions.checkArgument(
+ !userAgentVersion.equals(""), "Dataflow runner's `version` property cannot be empty.");
+ String userAgent
+ = String.format("%s/%s%s", userAgentName, userAgentVersion, agentJavaVer).replace(" ", "_");
+ dataflowOptions.setUserAgent(userAgent);
+
+ return new DataflowRunner(dataflowOptions);
+ }
+
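A usage sketch for the validation in fromOptions above (normally invoked for you by Pipeline.run(); all values are placeholders and GCP credentials must be available):

DataflowPipelineOptions opts = PipelineOptionsFactory.as(DataflowPipelineOptions.class);
opts.setProject("my-project");                     // a project ID, not a numeric project number
opts.setRegion("us-central1");                     // required when targeting the Dataflow service endpoint
opts.setGcpTempLocation("gs://my-bucket/temp");
opts.setStagingLocation("gs://my-bucket/staging");
DataflowRunner runner = DataflowRunner.fromOptions(opts); // validates options, normalizes jobName, stages the classpath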
+ static boolean isServiceEndpoint(String endpoint) {
+ return Strings.isNullOrEmpty(endpoint) || Pattern.matches(ENDPOINT_REGEXP, endpoint);
+ }
+
+ static void validateSdkContainerImageOptions(DataflowPipelineWorkerPoolOptions workerOptions) {
+ // Check against null - empty string value for workerHarnessContainerImage
+ // must be preserved for legacy dataflowWorkerJar to work.
+ String sdkContainerOption = workerOptions.getSdkContainerImage();
+ String workerHarnessOption = workerOptions.getWorkerHarnessContainerImage();
+ Preconditions.checkArgument(
+ sdkContainerOption == null
+ || workerHarnessOption == null
+ || sdkContainerOption.equals(workerHarnessOption),
+ "Cannot use legacy option workerHarnessContainerImage with sdkContainerImage. Prefer sdkContainerImage.");
+
+ // Default to new option, which may be null.
+ String containerImage = workerOptions.getSdkContainerImage();
+ if (workerOptions.getWorkerHarnessContainerImage() != null
+ && workerOptions.getSdkContainerImage() == null) {
+ // Set image to old option if old option was set but new option is not set.
+ LOG.warn(
+ "Prefer --sdkContainerImage over deprecated legacy option --workerHarnessContainerImage.");
+ containerImage = workerOptions.getWorkerHarnessContainerImage();
+ }
+
+ // Make sure both options have same value.
+ workerOptions.setSdkContainerImage(containerImage);
+ workerOptions.setWorkerHarnessContainerImage(containerImage);
+ }
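A behavior sketch for the harmonization above (hypothetical image name; the method is package-private, so this only compiles from within the runner package):

DataflowPipelineWorkerPoolOptions worker =
    PipelineOptionsFactory.as(DataflowPipelineWorkerPoolOptions.class);
worker.setWorkerHarnessContainerImage("gcr.io/my-project/legacy-harness:latest"); // deprecated option
DataflowRunner.validateSdkContainerImageOptions(worker);
// Both sdkContainerImage and workerHarnessContainerImage now return the legacy image;
// supplying two different non-null images would fail the precondition instead.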
+
+ @VisibleForTesting
+ static void validateWorkerSettings(DataflowPipelineWorkerPoolOptions workerOptions) {
+ DataflowPipelineOptions dataflowOptions = workerOptions.as(DataflowPipelineOptions.class);
+
+ validateSdkContainerImageOptions(workerOptions);
+
+ GcpOptions gcpOptions = workerOptions.as(GcpOptions.class);
+ Preconditions.checkArgument(
+ gcpOptions.getZone() == null || gcpOptions.getWorkerRegion() == null,
+ "Cannot use option zone with workerRegion. Prefer either workerZone or workerRegion.");
+ Preconditions.checkArgument(
+ gcpOptions.getZone() == null || gcpOptions.getWorkerZone() == null,
+ "Cannot use option zone with workerZone. Prefer workerZone.");
+ Preconditions.checkArgument(
+ gcpOptions.getWorkerRegion() == null || gcpOptions.getWorkerZone() == null,
+ "workerRegion and workerZone options are mutually exclusive.");
+
+ boolean hasExperimentWorkerRegion = false;
+ if (dataflowOptions.getExperiments() != null) {
+ for (String experiment : dataflowOptions.getExperiments()) {
+ if (experiment.startsWith("worker_region")) {
+ hasExperimentWorkerRegion = true;
+ break;
}
- });
- } else {
- dataflowOptions.setFilesToStage(
- detectClassPathResourcesToStage(DataflowRunner.class.getClassLoader(), options));
- if (dataflowOptions.getFilesToStage().isEmpty()) {
- throw new IllegalArgumentException("No files to stage has been found.");
- } else {
- LOG.info(
- "PipelineOptions.filesToStage was not specified. "
- + "Defaulting to files from the classpath: will stage {} files. "
- + "Enable logging at DEBUG level to see which files will be staged.",
- dataflowOptions.getFilesToStage().size());
- LOG.debug("Classpath elements: {}", dataflowOptions.getFilesToStage());
- }
- }
-
- // Verify jobName according to service requirements, truncating converting to lowercase if
- // necessary.
- String jobName = dataflowOptions.getJobName().toLowerCase();
- checkArgument(
- jobName.matches("[a-z]([-a-z0-9]*[a-z0-9])?"),
- "JobName invalid; the name must consist of only the characters "
- + "[-a-z0-9], starting with a letter and ending with a letter "
- + "or number");
- if (!jobName.equals(dataflowOptions.getJobName())) {
- LOG.info(
- "PipelineOptions.jobName did not match the service requirements. "
- + "Using {} instead of {}.",
- jobName,
- dataflowOptions.getJobName());
- }
- dataflowOptions.setJobName(jobName);
-
- // Verify project
- String project = dataflowOptions.getProject();
- if (project.matches("[0-9]*")) {
- throw new IllegalArgumentException(
- "Project ID '"
- + project
- + "' invalid. Please make sure you specified the Project ID, not project number.");
- } else if (!project.matches(PROJECT_ID_REGEXP)) {
- throw new IllegalArgumentException(
- "Project ID '"
- + project
- + "' invalid. Please make sure you specified the Project ID, not project"
- + " description.");
- }
-
- DataflowPipelineDebugOptions debugOptions =
- dataflowOptions.as(DataflowPipelineDebugOptions.class);
- // Verify the number of worker threads is a valid value
- if (debugOptions.getNumberOfWorkerHarnessThreads() < 0) {
- throw new IllegalArgumentException(
- "Number of worker harness threads '"
- + debugOptions.getNumberOfWorkerHarnessThreads()
- + "' invalid. Please make sure the value is non-negative.");
- }
-
- // Verify that if recordJfrOnGcThrashing is set, the pipeline is at least on java 11
- if (dataflowOptions.getRecordJfrOnGcThrashing()
- && Environments.getJavaVersion() == Environments.JavaVersion.java8) {
- throw new IllegalArgumentException(
- "recordJfrOnGcThrashing is only supported on java 9 and up.");
- }
-
- if (dataflowOptions.isStreaming() && dataflowOptions.getGcsUploadBufferSizeBytes() == null) {
- dataflowOptions.setGcsUploadBufferSizeBytes(GCS_UPLOAD_BUFFER_SIZE_BYTES_DEFAULT);
- }
-
- // Adding the Java version to the SDK name for user's and support convenience.
- String agentJavaVer = "(JRE 8 environment)";
- if (Environments.getJavaVersion() != Environments.JavaVersion.java8) {
- agentJavaVer =
- String.format("(JRE %s environment)", Environments.getJavaVersion().specification());
- }
-
- DataflowRunnerInfo dataflowRunnerInfo = DataflowRunnerInfo.getDataflowRunnerInfo();
- String userAgentName = dataflowRunnerInfo.getName();
- Preconditions.checkArgument(
- !userAgentName.equals(""), "Dataflow runner's `name` property cannot be empty.");
- String userAgentVersion = dataflowRunnerInfo.getVersion();
- Preconditions.checkArgument(
- !userAgentVersion.equals(""), "Dataflow runner's `version` property cannot be empty.");
- String userAgent =
- String.format("%s/%s%s", userAgentName, userAgentVersion, agentJavaVer).replace(" ", "_");
- dataflowOptions.setUserAgent(userAgent);
-
- return new DataflowRunner(dataflowOptions);
- }
-
- static boolean isServiceEndpoint(String endpoint) {
- return Strings.isNullOrEmpty(endpoint) || Pattern.matches(ENDPOINT_REGEXP, endpoint);
- }
-
- static void validateSdkContainerImageOptions(DataflowPipelineWorkerPoolOptions workerOptions) {
- // Check against null - empty string value for workerHarnessContainerImage
- // must be preserved for legacy dataflowWorkerJar to work.
- String sdkContainerOption = workerOptions.getSdkContainerImage();
- String workerHarnessOption = workerOptions.getWorkerHarnessContainerImage();
- Preconditions.checkArgument(
- sdkContainerOption == null
- || workerHarnessOption == null
- || sdkContainerOption.equals(workerHarnessOption),
- "Cannot use legacy option workerHarnessContainerImage with sdkContainerImage. Prefer sdkContainerImage.");
-
- // Default to new option, which may be null.
- String containerImage = workerOptions.getSdkContainerImage();
- if (workerOptions.getWorkerHarnessContainerImage() != null
- && workerOptions.getSdkContainerImage() == null) {
- // Set image to old option if old option was set but new option is not set.
- LOG.warn(
- "Prefer --sdkContainerImage over deprecated legacy option --workerHarnessContainerImage.");
- containerImage = workerOptions.getWorkerHarnessContainerImage();
- }
-
- // Make sure both options have same value.
- workerOptions.setSdkContainerImage(containerImage);
- workerOptions.setWorkerHarnessContainerImage(containerImage);
- }
-
- @VisibleForTesting
- static void validateWorkerSettings(DataflowPipelineWorkerPoolOptions workerOptions) {
- DataflowPipelineOptions dataflowOptions = workerOptions.as(DataflowPipelineOptions.class);
-
- validateSdkContainerImageOptions(workerOptions);
-
- GcpOptions gcpOptions = workerOptions.as(GcpOptions.class);
- Preconditions.checkArgument(
- gcpOptions.getZone() == null || gcpOptions.getWorkerRegion() == null,
- "Cannot use option zone with workerRegion. Prefer either workerZone or workerRegion.");
- Preconditions.checkArgument(
- gcpOptions.getZone() == null || gcpOptions.getWorkerZone() == null,
- "Cannot use option zone with workerZone. Prefer workerZone.");
- Preconditions.checkArgument(
- gcpOptions.getWorkerRegion() == null || gcpOptions.getWorkerZone() == null,
- "workerRegion and workerZone options are mutually exclusive.");
-
- boolean hasExperimentWorkerRegion = false;
- if (dataflowOptions.getExperiments() != null) {
- for (String experiment : dataflowOptions.getExperiments()) {
- if (experiment.startsWith("worker_region")) {
- hasExperimentWorkerRegion = true;
- break;
- }
- }
- }
- Preconditions.checkArgument(
- !hasExperimentWorkerRegion || gcpOptions.getWorkerRegion() == null,
- "Experiment worker_region and option workerRegion are mutually exclusive.");
- Preconditions.checkArgument(
- !hasExperimentWorkerRegion || gcpOptions.getWorkerZone() == null,
- "Experiment worker_region and option workerZone are mutually exclusive.");
-
- if (gcpOptions.getZone() != null) {
- LOG.warn("Option --zone is deprecated. Please use --workerZone instead.");
- gcpOptions.setWorkerZone(gcpOptions.getZone());
- gcpOptions.setZone(null);
- }
- }
-
- @VisibleForTesting
- protected DataflowRunner(DataflowPipelineOptions options) {
- this.options = options;
- this.dataflowClient = DataflowClient.create(options);
- this.translator = DataflowPipelineTranslator.fromOptions(options);
- this.pcollectionsRequiringIndexedFormat = new HashSet<>();
- this.pCollectionsPreservedKeys = new HashSet<>();
- this.pcollectionsRequiringAutoSharding = new HashSet<>();
- this.ptransformViewsWithNonDeterministicKeyCoders = new HashSet<>();
- }
-
- private static class AlwaysCreateViaRead<T>
- implements PTransformOverrideFactory<PBegin, PCollection<T>, Create.Values<T>> {
- @Override
- public PTransformOverrideFactory.PTransformReplacement<PBegin, Create.Values<T>>
- getReplacementTransform(
- AppliedPTransform<PBegin, PCollection<T>, Create.Values<T>> appliedTransform) {
- return PTransformOverrideFactory.PTransformReplacement.of(
- appliedTransform.getPipeline().begin(), appliedTransform.getTransform().alwaysUseRead());
+ }
+ }
+ Preconditions.checkArgument(
+ !hasExperimentWorkerRegion || gcpOptions.getWorkerRegion() == null,
+ "Experiment worker_region and option workerRegion are mutually exclusive.");
+ Preconditions.checkArgument(
+ !hasExperimentWorkerRegion || gcpOptions.getWorkerZone() == null,
+ "Experiment worker_region and option workerZone are mutually exclusive.");
+
+ if (gcpOptions.getZone() != null) {
+ LOG.warn("Option --zone is deprecated. Please use --workerZone instead.");
+ gcpOptions.setWorkerZone(gcpOptions.getZone());
+ gcpOptions.setZone(null);
+ }
}
- @Override
- public final Map<PCollection<?>, ReplacementOutput> mapOutputs(
- Map<TupleTag<?>, PCollection<?>> outputs, PCollection<T> newOutput) {
- return ReplacementOutputs.singleton(outputs, newOutput);
- }
- }
-
- private List<PTransformOverride> getOverrides(boolean streaming) {
- ImmutableList.Builder<PTransformOverride> overridesBuilder = ImmutableList.builder();
-
- // Create is implemented in terms of a Read, so it must precede the override to Read in
- // streaming
- overridesBuilder
- .add(
- PTransformOverride.of(
- PTransformMatchers.flattenWithDuplicateInputs(),
- DeduplicatedFlattenFactory.create()))
- .add(
- PTransformOverride.of(
- PTransformMatchers.emptyFlatten(), EmptyFlattenAsCreateFactory.instance()));
-
- if (streaming) {
- // For update compatibility, always use a Read for Create in streaming mode.
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Create.Values.class), new AlwaysCreateViaRead()));
- }
-
- // By default Dataflow runner replaces single-output ParDo with a ParDoSingle override.
- // However, we want a different expansion for single-output splittable ParDo.
- overridesBuilder
- .add(
- PTransformOverride.of(
- PTransformMatchers.splittableParDoSingle(),
- new ReflectiveOneToOneOverrideFactory(
- SplittableParDoOverrides.ParDoSingleViaMulti.class, this)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.splittableParDoMulti(),
- new SplittableParDoOverrides.SplittableParDoOverrideFactory()));
-
- if (streaming) {
- if (!hasExperiment(options, ENABLE_CUSTOM_PUBSUB_SOURCE)) {
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(PubsubUnboundedSource.class),
- new StreamingPubsubIOReadOverrideFactory()));
- }
- if (!hasExperiment(options, ENABLE_CUSTOM_PUBSUB_SINK)) {
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(PubsubUnboundedSink.class),
- new StreamingPubsubIOWriteOverrideFactory(this)));
- }
+ @VisibleForTesting
+ protected DataflowRunner(DataflowPipelineOptions options) {
+ this.options = options;
+ this.dataflowClient = DataflowClient.create(options);
+ this.translator = DataflowPipelineTranslator.fromOptions(options);
+ this.pcollectionsRequiringIndexedFormat = new HashSet<>();
+ this.pCollectionsPreservedKeys = new HashSet<>();
+ this.pcollectionsRequiringAutoSharding = new HashSet<>();
+ this.ptransformViewsWithNonDeterministicKeyCoders = new HashSet<>();
+ }
- try {
- overridesBuilder.add(KafkaIO.Read.KAFKA_READ_OVERRIDE);
- } catch (NoClassDefFoundError e) {
- // Do nothing. io-kafka is an optional dependency of runners-google-cloud-dataflow-java
- // and only needed when KafkaIO is used in the pipeline.
- }
+ private static class AlwaysCreateViaRead<T>
+ implements PTransformOverrideFactory<PBegin, PCollection<T>, Create.Values<T>> {
- overridesBuilder.add(SubscribeTransform.V1_READ_OVERRIDE);
+ @Override
+ public PTransformOverrideFactory.PTransformReplacement<PBegin, Create.Values<T>>
+ getReplacementTransform(
+ AppliedPTransform<PBegin, PCollection<T>, Create.Values<T>> appliedTransform) {
+ return PTransformOverrideFactory.PTransformReplacement.of(
+ appliedTransform.getPipeline().begin(), appliedTransform.getTransform().alwaysUseRead());
+ }
- if (!hasExperiment(options, "enable_file_dynamic_sharding")) {
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.writeWithRunnerDeterminedSharding(),
- new StreamingShardedWriteFactory(options)));
- }
-
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.groupIntoBatches(),
- new GroupIntoBatchesOverride.StreamingGroupIntoBatchesOverrideFactory(this)));
-
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.groupWithShardableStates(),
- new GroupIntoBatchesOverride.StreamingGroupIntoBatchesWithShardedKeyOverrideFactory(
- this)));
-
- overridesBuilder
- .add(
- // Streaming Bounded Read is implemented in terms of Streaming Unbounded Read, and
- // must precede it
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Read.Bounded.class),
- new StreamingBoundedReadOverrideFactory()))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Read.Unbounded.class),
- new StreamingUnboundedReadOverrideFactory()));
-
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(View.CreatePCollectionView.class),
- new StreamingCreatePCollectionViewFactory()));
-
- // Dataflow Streaming runner overrides the SPLITTABLE_PROCESS_KEYED transform
- // natively in the Dataflow service.
- } else {
- overridesBuilder.add(SplittableParDo.PRIMITIVE_BOUNDED_READ_OVERRIDE);
- overridesBuilder
- // Replace GroupIntoBatches before the state/timer replacements below since
- // GroupIntoBatches internally uses a stateful DoFn.
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(GroupIntoBatches.class),
- new GroupIntoBatchesOverride.BatchGroupIntoBatchesOverrideFactory<>(this)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(GroupIntoBatches.WithShardedKey.class),
- new GroupIntoBatchesOverride.BatchGroupIntoBatchesWithShardedKeyOverrideFactory<>(
- this)));
-
- overridesBuilder
- // State and timer pardos are implemented by expansion to GBK-then-ParDo
- .add(
- PTransformOverride.of(
- PTransformMatchers.stateOrTimerParDoMulti(),
- BatchStatefulParDoOverrides.multiOutputOverrideFactory(options)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.stateOrTimerParDoSingle(),
- BatchStatefulParDoOverrides.singleOutputOverrideFactory()));
- // Dataflow Batch runner uses the naive override of the SPLITTABLE_PROCESS_KEYED transform
- // for now, but eventually (when liquid sharding is implemented) will also override it
- // natively in the Dataflow service.
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.splittableProcessKeyedBounded(),
- new SplittableParDoNaiveBounded.OverrideFactory()));
-
- overridesBuilder
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(View.AsMap.class),
- new ReflectiveViewOverrideFactory(BatchViewOverrides.BatchViewAsMap.class, this)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(View.AsMultimap.class),
- new ReflectiveViewOverrideFactory(
- BatchViewOverrides.BatchViewAsMultimap.class, this)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Combine.GloballyAsSingletonView.class),
- new CombineGloballyAsSingletonViewOverrideFactory(this)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(View.AsList.class),
- new ReflectiveViewOverrideFactory(
- BatchViewOverrides.BatchViewAsList.class, this)))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(View.AsIterable.class),
- new ReflectiveViewOverrideFactory(
- BatchViewOverrides.BatchViewAsIterable.class, this)));
- }
- /* TODO(Beam-4684): Support @RequiresStableInput on Dataflow in a more intelligent way
+ @Override
+ public final Map<PCollection<?>, ReplacementOutput> mapOutputs(
+ Map<TupleTag<?>, PCollection<?>> outputs, PCollection<T> newOutput) {
+ return ReplacementOutputs.singleton(outputs, newOutput);
+ }
+ }
+
+ private List<PTransformOverride> getOverrides(boolean streaming) {
+ ImmutableList.Builder<PTransformOverride> overridesBuilder = ImmutableList.builder();
+
+ // Create is implemented in terms of a Read, so it must precede the override to Read in
+ // streaming
+ overridesBuilder
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.flattenWithDuplicateInputs(),
+ DeduplicatedFlattenFactory.create()))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.emptyFlatten(), EmptyFlattenAsCreateFactory.instance()));
+
+ if (streaming) {
+ // For update compatibility, always use a Read for Create in streaming mode.
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Create.Values.class), new AlwaysCreateViaRead()));
+ }
+
+ // By default Dataflow runner replaces single-output ParDo with a ParDoSingle override.
+ // However, we want a different expansion for single-output splittable ParDo.
+ overridesBuilder
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.splittableParDoSingle(),
+ new ReflectiveOneToOneOverrideFactory(
+ SplittableParDoOverrides.ParDoSingleViaMulti.class, this)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.splittableParDoMulti(),
+ new SplittableParDoOverrides.SplittableParDoOverrideFactory()));
+
+ if (streaming) {
+ if (!hasExperiment(options, ENABLE_CUSTOM_PUBSUB_SOURCE)) {
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(PubsubUnboundedSource.class),
+ new StreamingPubsubIOReadOverrideFactory()));
+ }
+ if (!hasExperiment(options, ENABLE_CUSTOM_PUBSUB_SINK)) {
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(PubsubUnboundedSink.class),
+ new StreamingPubsubIOWriteOverrideFactory(this)));
+ }
+
+ try {
+ overridesBuilder.add(KafkaIO.Read.KAFKA_READ_OVERRIDE);
+ } catch (NoClassDefFoundError e) {
+ // Do nothing. io-kafka is an optional dependency of runners-google-cloud-dataflow-java
+ // and only needed when KafkaIO is used in the pipeline.
+ }
+
+ overridesBuilder.add(SubscribeTransform.V1_READ_OVERRIDE);
+
+ if (!hasExperiment(options, "enable_file_dynamic_sharding")) {
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.writeWithRunnerDeterminedSharding(),
+ new StreamingShardedWriteFactory(options)));
+ }
+
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.groupIntoBatches(),
+ new GroupIntoBatchesOverride.StreamingGroupIntoBatchesOverrideFactory(this)));
+
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.groupWithShardableStates(),
+ new GroupIntoBatchesOverride.StreamingGroupIntoBatchesWithShardedKeyOverrideFactory(
+ this)));
+
+ overridesBuilder
+ .add(
+ // Streaming Bounded Read is implemented in terms of Streaming Unbounded Read, and
+ // must precede it
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Read.Bounded.class),
+ new StreamingBoundedReadOverrideFactory()))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Read.Unbounded.class),
+ new StreamingUnboundedReadOverrideFactory()));
+
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(View.CreatePCollectionView.class),
+ new StreamingCreatePCollectionViewFactory()));
+
+ // Dataflow Streaming runner overrides the SPLITTABLE_PROCESS_KEYED transform
+ // natively in the Dataflow service.
+ } else {
+ overridesBuilder.add(SplittableParDo.PRIMITIVE_BOUNDED_READ_OVERRIDE);
+ overridesBuilder
+ // Replace GroupIntoBatches before the state/timer replacements below since
+ // GroupIntoBatches internally uses a stateful DoFn.
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(GroupIntoBatches.class),
+ new GroupIntoBatchesOverride.BatchGroupIntoBatchesOverrideFactory<>(this)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(GroupIntoBatches.WithShardedKey.class),
+ new GroupIntoBatchesOverride.BatchGroupIntoBatchesWithShardedKeyOverrideFactory<>(
+ this)));
+
+ overridesBuilder
+ // State and timer pardos are implemented by expansion to GBK-then-ParDo
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.stateOrTimerParDoMulti(),
+ BatchStatefulParDoOverrides.multiOutputOverrideFactory(options)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.stateOrTimerParDoSingle(),
+ BatchStatefulParDoOverrides.singleOutputOverrideFactory()));
+ // Dataflow Batch runner uses the naive override of the SPLITTABLE_PROCESS_KEYED transform
+ // for now, but eventually (when liquid sharding is implemented) will also override it
+ // natively in the Dataflow service.
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.splittableProcessKeyedBounded(),
+ new SplittableParDoNaiveBounded.OverrideFactory()));
+
+ overridesBuilder
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(View.AsMap.class),
+ new ReflectiveViewOverrideFactory(BatchViewOverrides.BatchViewAsMap.class, this)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(View.AsMultimap.class),
+ new ReflectiveViewOverrideFactory(
+ BatchViewOverrides.BatchViewAsMultimap.class, this)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Combine.GloballyAsSingletonView.class),
+ new CombineGloballyAsSingletonViewOverrideFactory(this)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(View.AsList.class),
+ new ReflectiveViewOverrideFactory(
+ BatchViewOverrides.BatchViewAsList.class, this)))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(View.AsIterable.class),
+ new ReflectiveViewOverrideFactory(
+ BatchViewOverrides.BatchViewAsIterable.class, this)));
+ }
+ /* TODO(Beam-4684): Support @RequiresStableInput on Dataflow in a more intelligent way
Use Reshuffle might cause an extra and unnecessary shuffle to be inserted. To enable this, we
should make sure that we do not add extra shuffles for transforms whose input is already stable.
// Uses Reshuffle, so has to be before the Reshuffle override
@@ -775,2000 +810,2025 @@ private List<PTransformOverride> getOverrides(boolean streaming) {
PTransformOverride.of(
PTransformMatchers.requiresStableInputParDoMulti(),
RequiresStableInputParDoOverrides.multiOutputOverrideFactory()));
- */
- overridesBuilder
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Reshuffle.class), new ReshuffleOverrideFactory()))
- // Order is important. Streaming views almost all use Combine internally.
- .add(
- PTransformOverride.of(
- new DataflowPTransformMatchers.CombineValuesWithoutSideInputsPTransformMatcher(),
- new PrimitiveCombineGroupedValuesOverrideFactory()))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(ParDo.SingleOutput.class),
- new PrimitiveParDoSingleFactory()));
+ */
+ overridesBuilder
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Reshuffle.class), new ReshuffleOverrideFactory()))
+ // Order is important. Streaming views almost all use Combine internally.
+ .add(
+ PTransformOverride.of(
+ new DataflowPTransformMatchers.CombineValuesWithoutSideInputsPTransformMatcher(),
+ new PrimitiveCombineGroupedValuesOverrideFactory()))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(ParDo.SingleOutput.class),
+ new PrimitiveParDoSingleFactory()));
- overridesBuilder.add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(RedistributeByKey.class),
- new RedistributeByKeyOverrideFactory()));
-
- if (streaming) {
- // For update compatibility, always use a Read for Create in streaming mode.
- overridesBuilder
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Create.Values.class), new AlwaysCreateViaRead()))
- // Create is implemented in terms of BoundedRead.
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Read.Bounded.class),
- new StreamingBoundedReadOverrideFactory()))
- // Streaming Bounded Read is implemented in terms of Streaming Unbounded Read.
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(Read.Unbounded.class),
- new StreamingUnboundedReadOverrideFactory()))
- .add(
- PTransformOverride.of(
- PTransformMatchers.classEqualTo(ParDo.SingleOutput.class),
- new PrimitiveParDoSingleFactory()));
- }
-
- return overridesBuilder.build();
- }
-
- /**
- * Replace the {@link Combine.GloballyAsSingletonView} transform with a specialization which
- * re-applies the {@link CombineFn} and adds a specialization specific to the Dataflow runner.
- */
- private static class CombineGloballyAsSingletonViewOverrideFactory<InputT, ViewT>
- extends ReflectiveViewOverrideFactory<InputT, ViewT> {
-
- private CombineGloballyAsSingletonViewOverrideFactory(DataflowRunner runner) {
- super((Class) BatchViewOverrides.BatchViewAsSingleton.class, runner);
+ overridesBuilder.add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(RedistributeByKey.class),
+ new RedistributeByKeyOverrideFactory()));
+
+ if (streaming) {
+ // For update compatibility, always use a Read for Create in streaming mode.
+ overridesBuilder
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Create.Values.class), new AlwaysCreateViaRead()))
+ // Create is implemented in terms of BoundedRead.
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Read.Bounded.class),
+ new StreamingBoundedReadOverrideFactory()))
+ // Streaming Bounded Read is implemented in terms of Streaming Unbounded Read.
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(Read.Unbounded.class),
+ new StreamingUnboundedReadOverrideFactory()))
+ .add(
+ PTransformOverride.of(
+ PTransformMatchers.classEqualTo(ParDo.SingleOutput.class),
+ new PrimitiveParDoSingleFactory()));
+ }
+
+ return overridesBuilder.build();
}
- @Override
- public PTransformReplacement<PCollection<InputT>, PCollectionView<ViewT>>
- getReplacementTransform(
- AppliedPTransform<
- PCollection<InputT>,
- PCollectionView<ViewT>,
- PTransform<PCollection<InputT>, PCollectionView<ViewT>>>
- transform) {
- Combine.GloballyAsSingletonView<?, ?> combineTransform =
- (Combine.GloballyAsSingletonView) transform.getTransform();
- return PTransformReplacement.of(
- PTransformReplacements.getSingletonMainInput(transform),
- new BatchViewOverrides.BatchViewAsSingleton(
- runner,
- findCreatePCollectionView(transform),
- (CombineFn) combineTransform.getCombineFn(),
- combineTransform.getFanout()));
- }
- }
-
- /**
- * Replace the View.AsYYY transform with specialized view overrides for Dataflow. It is required
- * that the new replacement transform uses the supplied PCollectionView and does not create
- * another instance.
- */
- private static class ReflectiveViewOverrideFactory<InputT, ViewT>
- implements PTransformOverrideFactory<
- PCollection<InputT>,
- PCollectionView<ViewT>,
- PTransform<PCollection<InputT>, PCollectionView<ViewT>>> {
-
- final Class<PTransform<PCollection<InputT>, PCollectionView<ViewT>>> replacement;
- final DataflowRunner runner;
-
- private ReflectiveViewOverrideFactory(
- Class<PTransform<PCollection<InputT>, PCollectionView<ViewT>>> replacement,
- DataflowRunner runner) {
- this.replacement = replacement;
- this.runner = runner;
- }
-
- CreatePCollectionView findCreatePCollectionView(
- final AppliedPTransform<
- PCollection<InputT>,
- PCollectionView<ViewT>,
- PTransform<PCollection<InputT>, PCollectionView<ViewT>>>
- transform) {
- final AtomicReference<CreatePCollectionView> viewTransformRef = new AtomicReference<>();
- transform
- .getPipeline()
- .traverseTopologically(
- new PipelineVisitor.Defaults() {
- // Stores whether we have entered the expected composite view transform.
- private boolean tracking = false;
+ /**
+ * Replace the {@link Combine.GloballyAsSingletonView} transform with a
+ * specialization which re-applies the {@link CombineFn} and adds a
+ * specialization specific to the Dataflow runner.
+ */
+ private static class CombineGloballyAsSingletonViewOverrideFactory<InputT, ViewT>
+ extends ReflectiveViewOverrideFactory<InputT, ViewT> {
- @Override
- public CompositeBehavior enterCompositeTransform(Node node) {
- if (transform.getTransform() == node.getTransform()) {
- tracking = true;
- }
- return super.enterCompositeTransform(node);
- }
+ private CombineGloballyAsSingletonViewOverrideFactory(DataflowRunner runner) {
+ super((Class) BatchViewOverrides.BatchViewAsSingleton.class, runner);
+ }
- @Override
- public void visitPrimitiveTransform(Node node) {
- if (tracking && node.getTransform() instanceof CreatePCollectionView) {
- checkState(
- viewTransformRef.compareAndSet(
- null, (CreatePCollectionView) node.getTransform()),
- "Found more than one instance of a CreatePCollectionView when "
- + "attempting to replace %s, found [%s, %s]",
- replacement,
- viewTransformRef.get(),
- node.getTransform());
- }
- }
+ @Override
+ public PTransformReplacement<PCollection<InputT>, PCollectionView<ViewT>>
+ getReplacementTransform(
+ AppliedPTransform<
+ PCollection<InputT>, PCollectionView<ViewT>, PTransform<PCollection<InputT>, PCollectionView<ViewT>>> transform) {
+ Combine.GloballyAsSingletonView<?, ?> combineTransform
+ = (Combine.GloballyAsSingletonView) transform.getTransform();
+ return PTransformReplacement.of(
+ PTransformReplacements.getSingletonMainInput(transform),
+ new BatchViewOverrides.BatchViewAsSingleton(
+ runner,
+ findCreatePCollectionView(transform),
+ (CombineFn) combineTransform.getCombineFn(),
+ combineTransform.getFanout()));
+ }
+ }
- @Override
- public void leaveCompositeTransform(Node node) {
- if (transform.getTransform() == node.getTransform()) {
- tracking = false;
- }
- }
- });
+ /**
+ * Replace the View.AsYYY transform with specialized view overrides for
+ * Dataflow. It is required that the new replacement transform uses the
+ * supplied PCollectionView and does not create another instance.
+ */
+ private static class ReflectiveViewOverrideFactory<InputT, ViewT>
+ implements PTransformOverrideFactory<
+ PCollection<InputT>, PCollectionView<ViewT>, PTransform<PCollection<InputT>, PCollectionView<ViewT>>> {
+
+ final Class<PTransform<PCollection<InputT>, PCollectionView<ViewT>>> replacement;
+ final DataflowRunner runner;
+
+ private ReflectiveViewOverrideFactory(
+ Class<PTransform<PCollection<InputT>, PCollectionView<ViewT>>> replacement,
+ DataflowRunner runner) {
+ this.replacement = replacement;
+ this.runner = runner;
+ }
- checkState(
- viewTransformRef.get() != null,
- "Expected to find CreatePCollectionView contained within %s",
- transform.getTransform());
- return viewTransformRef.get();
- }
+ CreatePCollectionView findCreatePCollectionView(
+ final AppliedPTransform<
+ PCollection<InputT>, PCollectionView<ViewT>, PTransform<PCollection<InputT>, PCollectionView<ViewT>>> transform) {
+ final AtomicReference<CreatePCollectionView> viewTransformRef = new AtomicReference<>();
+ transform
+ .getPipeline()
+ .traverseTopologically(
+ new PipelineVisitor.Defaults() {
+ // Stores whether we have entered the expected composite view transform.
+ private boolean tracking = false;
+
+ @Override
+ public CompositeBehavior enterCompositeTransform(Node node) {
+ if (transform.getTransform() == node.getTransform()) {
+ tracking = true;
+ }
+ return super.enterCompositeTransform(node);
+ }
+
+ @Override
+ public void visitPrimitiveTransform(Node node) {
+ if (tracking && node.getTransform() instanceof CreatePCollectionView) {
+ checkState(
+ viewTransformRef.compareAndSet(
+ null, (CreatePCollectionView) node.getTransform()),
+ "Found more than one instance of a CreatePCollectionView when "
+ + "attempting to replace %s, found [%s, %s]",
+ replacement,
+ viewTransformRef.get(),
+ node.getTransform());
+ }
+ }
+
+ @Override
+ public void leaveCompositeTransform(Node node) {
+ if (transform.getTransform() == node.getTransform()) {
+ tracking = false;
+ }
+ }
+ });
+
+ checkState(
+ viewTransformRef.get() != null,
+ "Expected to find CreatePCollectionView contained within %s",
+ transform.getTransform());
+ return viewTransformRef.get();
+ }
- @Override
- public PTransformReplacement<PCollection<InputT>, PCollectionView<ViewT>>
- getReplacementTransform(
- final AppliedPTransform<
- PCollection<InputT>,
- PCollectionView<ViewT>,
- PTransform<PCollection<InputT>, PCollectionView<ViewT>>>
- transform) {
-
- PTransform<PCollection<InputT>, PCollectionView<ViewT>> rep =
- InstanceBuilder.ofType(replacement)
- .withArg(DataflowRunner.class, runner)
- .withArg(CreatePCollectionView.class, findCreatePCollectionView(transform))
- .build();
- return PTransformReplacement.of(
- PTransformReplacements.getSingletonMainInput(transform), (PTransform) rep);
- }
+ @Override
+ public PTransformReplacement<PCollection<InputT>, PCollectionView<ViewT>>
+ getReplacementTransform(
+ final AppliedPTransform<
+ PCollection<InputT>, PCollectionView<ViewT>, PTransform<PCollection<InputT>, PCollectionView<ViewT>>> transform) {
+
+ PTransform<PCollection<InputT>, PCollectionView<ViewT>> rep
+ = InstanceBuilder.ofType(replacement)
+ .withArg(DataflowRunner.class, runner)
+ .withArg(CreatePCollectionView.class, findCreatePCollectionView(transform))
+ .build();
+ return PTransformReplacement.of(
+ PTransformReplacements.getSingletonMainInput(transform), (PTransform) rep);
+ }
- @Override
- public Map<PCollection<?>, ReplacementOutput> mapOutputs(
- Map<TupleTag<?>, PCollection<?>> outputs, PCollectionView<ViewT> newOutput) {
- /*
+ @Override
+ public Map<PCollection<?>, ReplacementOutput> mapOutputs(
+ Map<TupleTag<?>, PCollection<?>> outputs, PCollectionView<ViewT> newOutput) {
+ /*
The output of View.AsXYZ is a PCollectionView that expands to the PCollection to be materialized.
The PCollectionView itself must have the same tag since that tag may have been embedded in serialized DoFns
previously and cannot easily be rewired. The PCollection may differ, so we rewire it, even if the rewiring
is a noop.
- */
- return ReplacementOutputs.singleton(outputs, newOutput);
+ */
+ return ReplacementOutputs.singleton(outputs, newOutput);
+ }
}
- }
- private static class ReflectiveOneToOneOverrideFactory<
+ private static class ReflectiveOneToOneOverrideFactory<
          InputT, OutputT, TransformT extends PTransform<PCollection<InputT>, PCollection<OutputT>>>
- extends SingleInputOutputOverrideFactory<
+ extends SingleInputOutputOverrideFactory<
          PCollection<InputT>, PCollection<OutputT>, TransformT> {
-    private final Class<PTransform<PCollection<InputT>, PCollection<OutputT>>> replacement;
-    private final DataflowRunner runner;
+    private final Class<PTransform<PCollection<InputT>, PCollection<OutputT>>> replacement;
+ private final DataflowRunner runner;
+
+ private ReflectiveOneToOneOverrideFactory(
+        Class<PTransform<PCollection<InputT>, PCollection<OutputT>>> replacement,
+ DataflowRunner runner) {
+ this.replacement = replacement;
+ this.runner = runner;
+ }
+
+ @Override
+    public PTransformReplacement<PCollection<InputT>, PCollection<OutputT>> getReplacementTransform(
+        AppliedPTransform<PCollection<InputT>, PCollection<OutputT>, TransformT> transform) {
+      PTransform<PCollection<InputT>, PCollection<OutputT>> rep
+          = InstanceBuilder.ofType(replacement)
+              .withArg(DataflowRunner.class, runner)
+              .withArg(
+                  (Class<TransformT>) transform.getTransform().getClass(), transform.getTransform())
+ .build();
+ return PTransformReplacement.of(PTransformReplacements.getSingletonMainInput(transform), rep);
+ }
+ }
+
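+  // Resolves every "AnyOf" environment in the pipeline proto to its Docker alternative, since
+  // Dataflow only executes pipeline steps in Docker environments.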
+ private RunnerApi.Pipeline resolveAnyOfEnvironments(RunnerApi.Pipeline pipeline) {
+ RunnerApi.Pipeline.Builder pipelineBuilder = pipeline.toBuilder();
+ RunnerApi.Components.Builder componentsBuilder = pipelineBuilder.getComponentsBuilder();
+ componentsBuilder.clearEnvironments();
+    for (Map.Entry<String, RunnerApi.Environment> entry
+ : pipeline.getComponents().getEnvironmentsMap().entrySet()) {
+ componentsBuilder.putEnvironments(
+ entry.getKey(),
+ Environments.resolveAnyOfEnvironment(
+ entry.getValue(),
+ BeamUrns.getUrn(RunnerApi.StandardEnvironments.Environments.DOCKER)));
+ }
+ return pipelineBuilder.build();
+ }
+
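+  // Rewrites the Docker container images of the pipeline's environments according to
+  // --sdkHarnessContainerImageOverrides, a comma-separated list of regex,replacement pairs,
+  // e.g. ".*java.*,gcr.io/my-project/beam_java_sdk" (illustrative value only). Default
+  // apache/beam images that were not overridden are redirected to the Dataflow-hosted
+  // container repository.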
+ protected RunnerApi.Pipeline applySdkEnvironmentOverrides(
+ RunnerApi.Pipeline pipeline, DataflowPipelineOptions options) {
+ String sdkHarnessContainerImageOverrides = options.getSdkHarnessContainerImageOverrides();
+ String[] overrides
+ = Strings.isNullOrEmpty(sdkHarnessContainerImageOverrides)
+ ? new String[0]
+ : sdkHarnessContainerImageOverrides.split(",", -1);
+ if (overrides.length % 2 != 0) {
+ throw new RuntimeException(
+ "invalid syntax for SdkHarnessContainerImageOverrides: "
+ + options.getSdkHarnessContainerImageOverrides());
+ }
+ RunnerApi.Pipeline.Builder pipelineBuilder = pipeline.toBuilder();
+ RunnerApi.Components.Builder componentsBuilder = pipelineBuilder.getComponentsBuilder();
+ componentsBuilder.clearEnvironments();
+    for (Map.Entry<String, RunnerApi.Environment> entry
+ : pipeline.getComponents().getEnvironmentsMap().entrySet()) {
+ RunnerApi.Environment.Builder environmentBuilder = entry.getValue().toBuilder();
+ if (BeamUrns.getUrn(RunnerApi.StandardEnvironments.Environments.DOCKER)
+ .equals(environmentBuilder.getUrn())) {
+ RunnerApi.DockerPayload dockerPayload;
+ try {
+ dockerPayload = RunnerApi.DockerPayload.parseFrom(environmentBuilder.getPayload());
+ } catch (InvalidProtocolBufferException e) {
+ throw new RuntimeException("Error parsing environment docker payload.", e);
+ }
+ String containerImage = dockerPayload.getContainerImage();
+ boolean updated = false;
+ for (int i = 0; i < overrides.length; i += 2) {
+ containerImage = containerImage.replaceAll(overrides[i], overrides[i + 1]);
+ if (!containerImage.equals(dockerPayload.getContainerImage())) {
+ updated = true;
+ }
+ }
+ if (containerImage.startsWith("apache/beam")
+ && !updated
+ // don't update if the container image is already configured by DataflowRunner
+ && !containerImage.equals(getContainerImageForJob(options))) {
+ containerImage
+ = DataflowRunnerInfo.getDataflowRunnerInfo().getContainerImageBaseRepository()
+ + containerImage.substring(containerImage.lastIndexOf("/"));
+ }
+ environmentBuilder.setPayload(
+ RunnerApi.DockerPayload.newBuilder()
+ .setContainerImage(containerImage)
+ .build()
+ .toByteString());
+ }
+ componentsBuilder.putEnvironments(entry.getKey(), environmentBuilder.build());
+ }
+ return pipelineBuilder.build();
+ }
+
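+  // Rewrites FILE-typed artifact dependencies into URL-typed dependencies that point to their
+  // staged location under --stagingLocation, so that workers can fetch them remotely.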
+ @VisibleForTesting
+ protected RunnerApi.Pipeline resolveArtifacts(RunnerApi.Pipeline pipeline) {
+ RunnerApi.Pipeline.Builder pipelineBuilder = pipeline.toBuilder();
+ RunnerApi.Components.Builder componentsBuilder = pipelineBuilder.getComponentsBuilder();
+ componentsBuilder.clearEnvironments();
+    for (Map.Entry<String, RunnerApi.Environment> entry
+ : pipeline.getComponents().getEnvironmentsMap().entrySet()) {
+ RunnerApi.Environment.Builder environmentBuilder = entry.getValue().toBuilder();
+ environmentBuilder.clearDependencies();
+ for (RunnerApi.ArtifactInformation info : entry.getValue().getDependenciesList()) {
+ if (!BeamUrns.getUrn(RunnerApi.StandardArtifacts.Types.FILE).equals(info.getTypeUrn())) {
+ throw new RuntimeException(
+ String.format("unsupported artifact type %s", info.getTypeUrn()));
+ }
+ RunnerApi.ArtifactFilePayload filePayload;
+ try {
+ filePayload = RunnerApi.ArtifactFilePayload.parseFrom(info.getTypePayload());
+ } catch (InvalidProtocolBufferException e) {
+ throw new RuntimeException("Error parsing artifact file payload.", e);
+ }
+ String stagedName;
+ if (BeamUrns.getUrn(RunnerApi.StandardArtifacts.Roles.STAGING_TO)
+ .equals(info.getRoleUrn())) {
+ try {
+ RunnerApi.ArtifactStagingToRolePayload stagingPayload
+ = RunnerApi.ArtifactStagingToRolePayload.parseFrom(info.getRolePayload());
+ stagedName = stagingPayload.getStagedName();
+ } catch (InvalidProtocolBufferException e) {
+ throw new RuntimeException("Error parsing artifact staging_to role payload.", e);
+ }
+ } else {
+ try {
+ File source = new File(filePayload.getPath());
+ HashCode hashCode = Files.asByteSource(source).hash(Hashing.sha256());
+ stagedName = Environments.createStagingFileName(source, hashCode);
+ } catch (IOException e) {
+ throw new RuntimeException(
+ String.format("Error creating staged name for artifact %s", filePayload.getPath()),
+ e);
+ }
+ }
+ environmentBuilder.addDependencies(
+ info.toBuilder()
+ .setTypeUrn(BeamUrns.getUrn(RunnerApi.StandardArtifacts.Types.URL))
+ .setTypePayload(
+ RunnerApi.ArtifactUrlPayload.newBuilder()
+ .setUrl(
+ FileSystems.matchNewResource(options.getStagingLocation(), true)
+ .resolve(
+ stagedName, ResolveOptions.StandardResolveOptions.RESOLVE_FILE)
+ .toString())
+ .setSha256(filePayload.getSha256())
+ .build()
+ .toByteString()));
+ }
+ componentsBuilder.putEnvironments(entry.getKey(), environmentBuilder.build());
+ }
+ return pipelineBuilder.build();
+ }
+
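+  // Uploads every FILE artifact referenced by the pipeline's environments to the staging
+  // location, de-duplicating by staged name, and returns the resulting staged packages.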
+  protected List<DataflowPackage> stageArtifacts(RunnerApi.Pipeline pipeline) {
+    ImmutableList.Builder<StagedFile> filesToStageBuilder = ImmutableList.builder();
+    Set<String> stagedNames = new HashSet<>();
+    for (Map.Entry<String, RunnerApi.Environment> entry
+ : pipeline.getComponents().getEnvironmentsMap().entrySet()) {
+ for (RunnerApi.ArtifactInformation info : entry.getValue().getDependenciesList()) {
+ if (!BeamUrns.getUrn(RunnerApi.StandardArtifacts.Types.FILE).equals(info.getTypeUrn())) {
+ throw new RuntimeException(
+ String.format("unsupported artifact type %s", info.getTypeUrn()));
+ }
+ RunnerApi.ArtifactFilePayload filePayload;
+ try {
+ filePayload = RunnerApi.ArtifactFilePayload.parseFrom(info.getTypePayload());
+ } catch (InvalidProtocolBufferException e) {
+ throw new RuntimeException("Error parsing artifact file payload.", e);
+ }
+ String stagedName;
+ if (BeamUrns.getUrn(RunnerApi.StandardArtifacts.Roles.STAGING_TO)
+ .equals(info.getRoleUrn())) {
+ try {
+ RunnerApi.ArtifactStagingToRolePayload stagingPayload
+ = RunnerApi.ArtifactStagingToRolePayload.parseFrom(info.getRolePayload());
+ stagedName = stagingPayload.getStagedName();
+ } catch (InvalidProtocolBufferException e) {
+ throw new RuntimeException("Error parsing artifact staging_to role payload.", e);
+ }
+ } else {
+ try {
+ File source = new File(filePayload.getPath());
+ HashCode hashCode = Files.asByteSource(source).hash(Hashing.sha256());
+ stagedName = Environments.createStagingFileName(source, hashCode);
+ } catch (IOException e) {
+ throw new RuntimeException(
+ String.format("Error creating staged name for artifact %s", filePayload.getPath()),
+ e);
+ }
+ }
+ if (stagedNames.contains(stagedName)) {
+ continue;
+ } else {
+ stagedNames.add(stagedName);
+ }
+ filesToStageBuilder.add(
+ StagedFile.of(filePayload.getPath(), filePayload.getSha256(), stagedName));
+ }
+ }
+ return options.getStager().stageFiles(filesToStageBuilder.build());
+ }
+
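+  // Collects the default artifacts for the job's environment: an optional user-supplied
+  // Dataflow worker jar, the configured files to stage, and an optional Windmill binary
+  // override.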
+  private List<RunnerApi.ArtifactInformation> getDefaultArtifacts() {
+    ImmutableList.Builder<String> pathsToStageBuilder = ImmutableList.builder();
+ String windmillBinary
+ = options.as(DataflowStreamingPipelineOptions.class).getOverrideWindmillBinary();
+ String dataflowWorkerJar = options.getDataflowWorkerJar();
+ if (dataflowWorkerJar != null && !dataflowWorkerJar.isEmpty() && !useUnifiedWorker(options)) {
+ // Put the user specified worker jar at the start of the classpath, to be consistent with the
+ // built in worker order.
+ pathsToStageBuilder.add("dataflow-worker.jar=" + dataflowWorkerJar);
+ }
+ pathsToStageBuilder.addAll(options.getFilesToStage());
+ if (windmillBinary != null) {
+ pathsToStageBuilder.add("windmill_main=" + windmillBinary);
+ }
+ return Environments.getArtifacts(pathsToStageBuilder.build());
+ }
+
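+  // A pipeline is considered multi-language if any of its transforms was expanded by an
+  // external (cross-language) expansion service.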
+ @VisibleForTesting
+ static boolean isMultiLanguagePipeline(Pipeline pipeline) {
+ class IsMultiLanguageVisitor extends PipelineVisitor.Defaults {
+
+ private boolean isMultiLanguage = false;
+
+ private void performMultiLanguageTest(Node node) {
+ if (node.getTransform() instanceof External.ExpandableTransform) {
+ isMultiLanguage = true;
+ }
+ }
+
+ @Override
+ public CompositeBehavior enterCompositeTransform(Node node) {
+ performMultiLanguageTest(node);
+ return super.enterCompositeTransform(node);
+ }
- private ReflectiveOneToOneOverrideFactory(
-        Class<PTransform<PCollection<InputT>, PCollection<OutputT>>> replacement,
- DataflowRunner runner) {
- this.replacement = replacement;
- this.runner = runner;
+ @Override
+ public void visitPrimitiveTransform(Node node) {
+ performMultiLanguageTest(node);
+ super.visitPrimitiveTransform(node);
+ }
+ }
+
+ IsMultiLanguageVisitor visitor = new IsMultiLanguageVisitor();
+ pipeline.traverseTopologically(visitor);
+
+ return visitor.isMultiLanguage;
+ }
+
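+  // True if the user requested transform upgrades via ExternalTranslationOptions; such
+  // pipelines are automatically switched to Runner v2 in run() below.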
+ private static boolean includesTransformUpgrades(Pipeline pipeline) {
+ return (pipeline
+ .getOptions()
+ .as(ExternalTranslationOptions.class)
+ .getTransformsToOverride()
+ .size()
+ > 0);
}
@Override
-    public PTransformReplacement<PCollection<InputT>, PCollection<OutputT>> getReplacementTransform(
-        AppliedPTransform<PCollection<InputT>, PCollection<OutputT>, TransformT> transform) {
-      PTransform<PCollection<InputT>, PCollection<OutputT>> rep =
- InstanceBuilder.ofType(replacement)
- .withArg(DataflowRunner.class, runner)
- .withArg(
-                  (Class<TransformT>) transform.getTransform().getClass(), transform.getTransform())
- .build();
- return PTransformReplacement.of(PTransformReplacements.getSingletonMainInput(transform), rep);
- }
- }
-
- private RunnerApi.Pipeline resolveAnyOfEnvironments(RunnerApi.Pipeline pipeline) {
- RunnerApi.Pipeline.Builder pipelineBuilder = pipeline.toBuilder();
- RunnerApi.Components.Builder componentsBuilder = pipelineBuilder.getComponentsBuilder();
- componentsBuilder.clearEnvironments();
- for (Map.Entry entry :
- pipeline.getComponents().getEnvironmentsMap().entrySet()) {
- componentsBuilder.putEnvironments(
- entry.getKey(),
- Environments.resolveAnyOfEnvironment(
- entry.getValue(),
- BeamUrns.getUrn(RunnerApi.StandardEnvironments.Environments.DOCKER)));
- }
- return pipelineBuilder.build();
- }
-
- protected RunnerApi.Pipeline applySdkEnvironmentOverrides(
- RunnerApi.Pipeline pipeline, DataflowPipelineOptions options) {
- String sdkHarnessContainerImageOverrides = options.getSdkHarnessContainerImageOverrides();
- String[] overrides =
- Strings.isNullOrEmpty(sdkHarnessContainerImageOverrides)
- ? new String[0]
- : sdkHarnessContainerImageOverrides.split(",", -1);
- if (overrides.length % 2 != 0) {
- throw new RuntimeException(
- "invalid syntax for SdkHarnessContainerImageOverrides: "
- + options.getSdkHarnessContainerImageOverrides());
- }
- RunnerApi.Pipeline.Builder pipelineBuilder = pipeline.toBuilder();
- RunnerApi.Components.Builder componentsBuilder = pipelineBuilder.getComponentsBuilder();
- componentsBuilder.clearEnvironments();
- for (Map.Entry entry :
- pipeline.getComponents().getEnvironmentsMap().entrySet()) {
- RunnerApi.Environment.Builder environmentBuilder = entry.getValue().toBuilder();
- if (BeamUrns.getUrn(RunnerApi.StandardEnvironments.Environments.DOCKER)
- .equals(environmentBuilder.getUrn())) {
- RunnerApi.DockerPayload dockerPayload;
+ public DataflowPipelineJob run(Pipeline pipeline) {
+ // Multi-language pipelines and pipelines that include upgrades should automatically be upgraded
+ // to Runner v2.
+ if (DataflowRunner.isMultiLanguagePipeline(pipeline) || includesTransformUpgrades(pipeline)) {
+      List<String> experiments = firstNonNull(options.getExperiments(), Collections.emptyList());
+ if (!experiments.contains("use_runner_v2")) {
+ LOG.info(
+ "Automatically enabling Dataflow Runner v2 since the pipeline used cross-language"
+ + " transforms or pipeline needed a transform upgrade.");
+ options.setExperiments(
+            ImmutableList.<String>builder().addAll(experiments).add("use_runner_v2").build());
+ }
+ }
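+    // Running on the unified worker requires the full set of portability experiments; fail
+    // fast if Runner v2 was simultaneously disabled through an experiment.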
+ if (useUnifiedWorker(options)) {
+ if (hasExperiment(options, "disable_runner_v2")
+ || hasExperiment(options, "disable_runner_v2_until_2023")
+ || hasExperiment(options, "disable_prime_runner_v2")) {
+ throw new IllegalArgumentException(
+ "Runner V2 both disabled and enabled: at least one of ['beam_fn_api', 'use_unified_worker', 'use_runner_v2', 'use_portable_job_submission'] is set and also one of ['disable_runner_v2', 'disable_runner_v2_until_2023', 'disable_prime_runner_v2'] is set.");
+ }
+      List<String> experiments
+ = new ArrayList<>(options.getExperiments()); // non-null if useUnifiedWorker is true
+ if (!experiments.contains("use_runner_v2")) {
+ experiments.add("use_runner_v2");
+ }
+ if (!experiments.contains("use_unified_worker")) {
+ experiments.add("use_unified_worker");
+ }
+ if (!experiments.contains("beam_fn_api")) {
+ experiments.add("beam_fn_api");
+ }
+ if (!experiments.contains("use_portable_job_submission")) {
+ experiments.add("use_portable_job_submission");
+ }
+ options.setExperiments(ImmutableList.copyOf(experiments));
+ // Ensure that logging via the FnApi is enabled
+ options.as(SdkHarnessOptions.class).setEnableLogViaFnApi(true);
+ }
+
+ logWarningIfPCollectionViewHasNonDeterministicKeyCoder(pipeline);
+ logWarningIfBigqueryDLQUnused(pipeline);
+ if (shouldActAsStreaming(pipeline)) {
+ options.setStreaming(true);
+
+ if (useUnifiedWorker(options)) {
+ options.setEnableStreamingEngine(true);
+        List<String> experiments
+ = new ArrayList<>(options.getExperiments()); // non-null if useUnifiedWorker is true
+ if (!experiments.contains("enable_streaming_engine")) {
+ experiments.add("enable_streaming_engine");
+ }
+ if (!experiments.contains("enable_windmill_service")) {
+ experiments.add("enable_windmill_service");
+ }
+ }
+ }
+
+ if (!ExperimentalOptions.hasExperiment(options, "disable_projection_pushdown")) {
+ ProjectionPushdownOptimizer.optimize(pipeline);
+ }
+
+ LOG.info(
+ "Executing pipeline on the Dataflow Service, which will have billing implications "
+ + "related to Google Compute Engine usage and other Google Cloud Services.");
+
+ DataflowPipelineOptions dataflowOptions = options.as(DataflowPipelineOptions.class);
+ String workerHarnessContainerImageURL = DataflowRunner.getContainerImageForJob(dataflowOptions);
+
+ // This incorrectly puns the worker harness container image (which implements v1beta3 API)
+ // with the SDK harness image (which implements Fn API).
+ //
+ // The same Environment is used in different and contradictory ways, depending on whether
+ // it is a v1 or v2 job submission.
+ RunnerApi.Environment defaultEnvironmentForDataflow
+ = Environments.createDockerEnvironment(workerHarnessContainerImageURL);
+
+    // The SdkComponents for portable and non-portable job submission must be kept distinct. Both
+    // need the default environment.
+ SdkComponents portableComponents = SdkComponents.create();
+ portableComponents.registerEnvironment(
+ defaultEnvironmentForDataflow
+ .toBuilder()
+ .addAllDependencies(getDefaultArtifacts())
+ .addAllCapabilities(Environments.getJavaCapabilities())
+ .build());
+
+ RunnerApi.Pipeline portablePipelineProto
+ = PipelineTranslation.toProto(pipeline, portableComponents, false);
+    // Note that `stageArtifacts` has to be called before `resolveArtifacts` because
+    // `resolveArtifacts` updates local paths to staged paths in the pipeline proto.
+ portablePipelineProto = resolveAnyOfEnvironments(portablePipelineProto);
+    List<DataflowPackage> packages = stageArtifacts(portablePipelineProto);
+ portablePipelineProto = resolveArtifacts(portablePipelineProto);
+ portablePipelineProto = applySdkEnvironmentOverrides(portablePipelineProto, options);
+ if (LOG.isDebugEnabled()) {
+ LOG.debug(
+ "Portable pipeline proto:\n{}",
+ TextFormat.printer().printToString(portablePipelineProto));
+ }
+ // Stage the portable pipeline proto, retrieving the staged pipeline path, then update
+ // the options on the new job
+ // TODO: add an explicit `pipeline` parameter to the submission instead of pipeline options
+ LOG.info("Staging portable pipeline proto to {}", options.getStagingLocation());
+ byte[] serializedProtoPipeline = portablePipelineProto.toByteArray();
+
+ DataflowPackage stagedPipeline
+ = options.getStager().stageToFile(serializedProtoPipeline, PIPELINE_FILE_NAME);
+ dataflowOptions.setPipelineUrl(stagedPipeline.getLocation());
+
+ if (useUnifiedWorker(options)) {
+ LOG.info("Skipping v1 transform replacements since job will run on v2.");
+ } else {
+ // Now rewrite things to be as needed for v1 (mutates the pipeline)
+ // This way the job submitted is valid for v1 and v2, simultaneously
+ replaceV1Transforms(pipeline);
+ }
+ // Capture the SdkComponents for look up during step translations
+ SdkComponents dataflowV1Components = SdkComponents.create();
+ dataflowV1Components.registerEnvironment(
+ defaultEnvironmentForDataflow
+ .toBuilder()
+ .addAllDependencies(getDefaultArtifacts())
+ .addAllCapabilities(Environments.getJavaCapabilities())
+ .build());
+ // No need to perform transform upgrading for the Runner v1 proto.
+ RunnerApi.Pipeline dataflowV1PipelineProto
+ = PipelineTranslation.toProto(pipeline, dataflowV1Components, true, false);
+
+ if (LOG.isDebugEnabled()) {
+ LOG.debug(
+ "Dataflow v1 pipeline proto:\n{}",
+ TextFormat.printer().printToString(dataflowV1PipelineProto));
+ }
+
+ // Set a unique client_request_id in the CreateJob request.
+ // This is used to ensure idempotence of job creation across retried
+ // attempts to create a job. Specifically, if the service returns a job with
+ // a different client_request_id, it means the returned one is a different
+ // job previously created with the same job name, and that the job creation
+ // has been effectively rejected. The SDK should return
+ // Error::Already_Exists to user in that case.
+ int randomNum = new Random().nextInt(9000) + 1000;
+ String requestId
+ = DateTimeFormat.forPattern("YYYYMMddHHmmssmmm")
+ .withZone(DateTimeZone.UTC)
+ .print(DateTimeUtils.currentTimeMillis())
+ + "_"
+ + randomNum;
+
+ JobSpecification jobSpecification
+ = translator.translate(
+ pipeline, dataflowV1PipelineProto, dataflowV1Components, this, packages);
+
+ if (!isNullOrEmpty(dataflowOptions.getDataflowWorkerJar()) && !useUnifiedWorker(options)) {
+      List<String> experiments
+ = firstNonNull(dataflowOptions.getExperiments(), Collections.emptyList());
+ if (!experiments.contains("use_staged_dataflow_worker_jar")) {
+ dataflowOptions.setExperiments(
+            ImmutableList.<String>builder()
+ .addAll(experiments)
+ .add("use_staged_dataflow_worker_jar")
+ .build());
+ }
+ }
+
+ Job newJob = jobSpecification.getJob();
try {
- dockerPayload = RunnerApi.DockerPayload.parseFrom(environmentBuilder.getPayload());
- } catch (InvalidProtocolBufferException e) {
- throw new RuntimeException("Error parsing environment docker payload.", e);
- }
- String containerImage = dockerPayload.getContainerImage();
- boolean updated = false;
- for (int i = 0; i < overrides.length; i += 2) {
- containerImage = containerImage.replaceAll(overrides[i], overrides[i + 1]);
- if (!containerImage.equals(dockerPayload.getContainerImage())) {
- updated = true;
- }
- }
- if (containerImage.startsWith("apache/beam")
- && !updated
- // don't update if the container image is already configured by DataflowRunner
- && !containerImage.equals(getContainerImageForJob(options))) {
- containerImage =
- DataflowRunnerInfo.getDataflowRunnerInfo().getContainerImageBaseRepository()
- + containerImage.substring(containerImage.lastIndexOf("/"));
- }
- environmentBuilder.setPayload(
- RunnerApi.DockerPayload.newBuilder()
- .setContainerImage(containerImage)
- .build()
- .toByteString());
- }
- componentsBuilder.putEnvironments(entry.getKey(), environmentBuilder.build());
- }
- return pipelineBuilder.build();
- }
-
- @VisibleForTesting
- protected RunnerApi.Pipeline resolveArtifacts(RunnerApi.Pipeline pipeline) {
- RunnerApi.Pipeline.Builder pipelineBuilder = pipeline.toBuilder();
- RunnerApi.Components.Builder componentsBuilder = pipelineBuilder.getComponentsBuilder();
- componentsBuilder.clearEnvironments();
- for (Map.Entry entry :
- pipeline.getComponents().getEnvironmentsMap().entrySet()) {
- RunnerApi.Environment.Builder environmentBuilder = entry.getValue().toBuilder();
- environmentBuilder.clearDependencies();
- for (RunnerApi.ArtifactInformation info : entry.getValue().getDependenciesList()) {
- if (!BeamUrns.getUrn(RunnerApi.StandardArtifacts.Types.FILE).equals(info.getTypeUrn())) {
- throw new RuntimeException(
- String.format("unsupported artifact type %s", info.getTypeUrn()));
- }
- RunnerApi.ArtifactFilePayload filePayload;
+ newJob
+ .getEnvironment()
+ .setSdkPipelineOptions(
+ MAPPER.readValue(MAPPER_WITH_MODULES.writeValueAsBytes(options), Map.class));
+ } catch (IOException e) {
+ throw new IllegalArgumentException(
+ "PipelineOptions specified failed to serialize to JSON.", e);
+ }
+ newJob.setClientRequestId(requestId);
+
+ DataflowRunnerInfo dataflowRunnerInfo = DataflowRunnerInfo.getDataflowRunnerInfo();
+ String version = dataflowRunnerInfo.getVersion();
+ checkState(
+ !"${pom.version}".equals(version),
+ "Unable to submit a job to the Dataflow service with unset version ${pom.version}");
+ LOG.info("Dataflow SDK version: {}", version);
+
+ newJob.getEnvironment().setUserAgent((Map) dataflowRunnerInfo.getProperties());
+    // The Dataflow Service may write to the temporary directory directly, so
+    // it must be verified.
+ if (!isNullOrEmpty(options.getGcpTempLocation())) {
+ newJob
+ .getEnvironment()
+ .setTempStoragePrefix(
+ dataflowOptions.getPathValidator().verifyPath(options.getGcpTempLocation()));
+ }
+ newJob.getEnvironment().setDataset(options.getTempDatasetId());
+
+ if (options.getWorkerRegion() != null) {
+ newJob.getEnvironment().setWorkerRegion(options.getWorkerRegion());
+ }
+ if (options.getWorkerZone() != null) {
+ newJob.getEnvironment().setWorkerZone(options.getWorkerZone());
+ }
+
+ if (options.getFlexRSGoal()
+ == DataflowPipelineOptions.FlexResourceSchedulingGoal.COST_OPTIMIZED) {
+ newJob.getEnvironment().setFlexResourceSchedulingGoal("FLEXRS_COST_OPTIMIZED");
+ } else if (options.getFlexRSGoal()
+ == DataflowPipelineOptions.FlexResourceSchedulingGoal.SPEED_OPTIMIZED) {
+ newJob.getEnvironment().setFlexResourceSchedulingGoal("FLEXRS_SPEED_OPTIMIZED");
+ }
+
+ // Represent the minCpuPlatform pipeline option as an experiment, if not already present.
+ if (!isNullOrEmpty(dataflowOptions.getMinCpuPlatform())) {
+      List<String> experiments
+ = firstNonNull(dataflowOptions.getExperiments(), Collections.emptyList());
+
+      List<String> minCpuFlags
+ = experiments.stream()
+ .filter(p -> p.startsWith("min_cpu_platform"))
+ .collect(Collectors.toList());
+
+ if (minCpuFlags.isEmpty()) {
+ dataflowOptions.setExperiments(
+            ImmutableList.<String>builder()
+ .addAll(experiments)
+ .add("min_cpu_platform=" + dataflowOptions.getMinCpuPlatform())
+ .build());
+ } else {
+ LOG.warn(
+ "Flag min_cpu_platform is defined in both top level PipelineOption, "
+ + "as well as under experiments. Proceed using {}.",
+ minCpuFlags.get(0));
+ }
+ }
+
+ newJob
+ .getEnvironment()
+ .setExperiments(
+ ImmutableList.copyOf(
+ firstNonNull(dataflowOptions.getExperiments(), Collections.emptyList())));
+
+ // Set the Docker container image that executes Dataflow worker harness, residing in Google
+ // Container Registry. Translator is guaranteed to create a worker pool prior to this point.
+ // For runner_v1, only worker_harness_container is set.
+ // For runner_v2, both worker_harness_container and sdk_harness_container are set to the same
+ // value.
+ String containerImage = getContainerImageForJob(options);
+ for (WorkerPool workerPool : newJob.getEnvironment().getWorkerPools()) {
+ workerPool.setWorkerHarnessContainerImage(containerImage);
+ }
+
+ configureSdkHarnessContainerImages(options, portablePipelineProto, newJob);
+
+ newJob.getEnvironment().setVersion(getEnvironmentVersion(options));
+
+ if (hooks != null) {
+ hooks.modifyEnvironmentBeforeSubmission(newJob.getEnvironment());
+ }
+
+ // enable upload_graph when the graph is too large
+ byte[] jobGraphBytes = DataflowPipelineTranslator.jobToString(newJob).getBytes(UTF_8);
+ int jobGraphByteSize = jobGraphBytes.length;
+ if (jobGraphByteSize >= CREATE_JOB_REQUEST_LIMIT_BYTES
+ && !hasExperiment(options, "upload_graph")
+ && !useUnifiedWorker(options)) {
+      List<String> experiments = firstNonNull(options.getExperiments(), Collections.emptyList());
+ options.setExperiments(
+          ImmutableList.<String>builder().addAll(experiments).add("upload_graph").build());
+ LOG.info(
+          "The job graph size ({} bytes) is larger than {}. Automatically adding "
+              + "the upload_graph option to experiments.",
+ jobGraphByteSize,
+ CREATE_JOB_REQUEST_LIMIT_BYTES);
+ }
+
+ if (hasExperiment(options, "upload_graph") && useUnifiedWorker(options)) {
+      ArrayList<String> experiments = new ArrayList<>(options.getExperiments());
+ while (experiments.remove("upload_graph")) {
+ }
+ options.setExperiments(experiments);
+ LOG.warn(
+ "The upload_graph experiment was specified, but it does not apply "
+ + "to runner v2 jobs. Option has been automatically removed.");
+ }
+
+ // Upload the job to GCS and remove the graph object from the API call. The graph
+ // will be downloaded from GCS by the service.
+ if (hasExperiment(options, "upload_graph")) {
+ DataflowPackage stagedGraph
+ = options.getStager().stageToFile(jobGraphBytes, DATAFLOW_GRAPH_FILE_NAME);
+ newJob.getSteps().clear();
+ newJob.setStepsLocation(stagedGraph.getLocation());
+ }
+
+ if (!isNullOrEmpty(options.getDataflowJobFile())
+ || !isNullOrEmpty(options.getTemplateLocation())) {
+ boolean isTemplate = !isNullOrEmpty(options.getTemplateLocation());
+ if (isTemplate) {
+ checkArgument(
+ isNullOrEmpty(options.getDataflowJobFile()),
+ "--dataflowJobFile and --templateLocation are mutually exclusive.");
+ }
+ String fileLocation
+ = firstNonNull(options.getTemplateLocation(), options.getDataflowJobFile());
+ checkArgument(
+ fileLocation.startsWith("/") || fileLocation.startsWith("gs://"),
+ "Location must be local or on Cloud Storage, got %s.",
+ fileLocation);
+
+ try {
+ printWorkSpecJsonToFile(fileLocation, newJob);
+ LOG.info("Printed job specification to {}", fileLocation);
+ } catch (IOException ex) {
+ String error = String.format("Cannot create output file at %s", fileLocation);
+ if (isTemplate) {
+ throw new RuntimeException(error, ex);
+ } else {
+ LOG.warn(error, ex);
+ }
+ }
+
+ if (isTemplate) {
+ LOG.info("Template successfully created.");
+ return new DataflowTemplateJob();
+ }
+ }
+
+ String jobIdToUpdate = null;
+ if (options.isUpdate()) {
+ jobIdToUpdate = getJobIdFromName(options.getJobName());
+ newJob.setTransformNameMapping(options.getTransformNameMapping());
+ newJob.setReplaceJobId(jobIdToUpdate);
+ }
+ if (options.getCreateFromSnapshot() != null && !options.getCreateFromSnapshot().isEmpty()) {
+ newJob.setTransformNameMapping(options.getTransformNameMapping());
+ newJob.setCreatedFromSnapshotId(options.getCreateFromSnapshot());
+ }
+
+ Job jobResult;
try {
- filePayload = RunnerApi.ArtifactFilePayload.parseFrom(info.getTypePayload());
- } catch (InvalidProtocolBufferException e) {
- throw new RuntimeException("Error parsing artifact file payload.", e);
- }
- String stagedName;
- if (BeamUrns.getUrn(RunnerApi.StandardArtifacts.Roles.STAGING_TO)
- .equals(info.getRoleUrn())) {
- try {
- RunnerApi.ArtifactStagingToRolePayload stagingPayload =
- RunnerApi.ArtifactStagingToRolePayload.parseFrom(info.getRolePayload());
- stagedName = stagingPayload.getStagedName();
- } catch (InvalidProtocolBufferException e) {
- throw new RuntimeException("Error parsing artifact staging_to role payload.", e);
- }
- } else {
- try {
- File source = new File(filePayload.getPath());
- HashCode hashCode = Files.asByteSource(source).hash(Hashing.sha256());
- stagedName = Environments.createStagingFileName(source, hashCode);
- } catch (IOException e) {
+ jobResult = dataflowClient.createJob(newJob);
+ } catch (GoogleJsonResponseException e) {
+ String errorMessages = "Unexpected errors";
+ if (e.getDetails() != null) {
+ if (jobGraphByteSize >= CREATE_JOB_REQUEST_LIMIT_BYTES) {
+ errorMessages
+ = "The size of the serialized JSON representation of the pipeline "
+ + "exceeds the allowable limit. "
+ + "For more information, please see the documentation on job submission:\n"
+ + "https://cloud.google.com/dataflow/docs/guides/deploying-a-pipeline#jobs";
+ } else {
+ errorMessages = e.getDetails().getMessage();
+ }
+ }
+ throw new RuntimeException("Failed to create a workflow job: " + errorMessages, e);
+ } catch (IOException e) {
+ throw new RuntimeException("Failed to create a workflow job", e);
+ }
+
+ // Use a raw client for post-launch monitoring, as status calls may fail
+ // regularly and need not be retried automatically.
+ DataflowPipelineJob dataflowPipelineJob
+ = new DataflowPipelineJob(
+ DataflowClient.create(options),
+ jobResult.getId(),
+ options,
+ jobSpecification != null ? jobSpecification.getStepNames() : Collections.emptyMap(),
+ portablePipelineProto);
+
+ // If the service returned client request id, the SDK needs to compare it
+ // with the original id generated in the request, if they are not the same
+ // (i.e., the returned job is not created by this request), throw
+ // DataflowJobAlreadyExistsException or DataflowJobAlreadyUpdatedException
+ // depending on whether this is a reload or not.
+ if (jobResult.getClientRequestId() != null
+ && !jobResult.getClientRequestId().isEmpty()
+ && !jobResult.getClientRequestId().equals(requestId)) {
+ // If updating a job.
+ if (options.isUpdate()) {
+ throw new DataflowJobAlreadyUpdatedException(
+ dataflowPipelineJob,
+ String.format(
+ "The job named %s with id: %s has already been updated into job id: %s "
+ + "and cannot be updated again.",
+ newJob.getName(), jobIdToUpdate, jobResult.getId()));
+ } else {
+ throw new DataflowJobAlreadyExistsException(
+ dataflowPipelineJob,
+ String.format(
+ "There is already an active job named %s with id: %s. If you want to submit a"
+ + " second job, try again by setting a different name using --jobName.",
+ newJob.getName(), jobResult.getId()));
+ }
+ }
+
+ LOG.info(
+ "To access the Dataflow monitoring console, please navigate to {}",
+ MonitoringUtil.getJobMonitoringPageURL(
+ options.getProject(), options.getRegion(), jobResult.getId()));
+ LOG.info("Submitted job: {}", jobResult.getId());
+
+ LOG.info(
+ "To cancel the job using the 'gcloud' tool, run:\n> {}",
+ MonitoringUtil.getGcloudCancelCommand(options, jobResult.getId()));
+
+ return dataflowPipelineJob;
+ }
+
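+  // Writes the job's JSON specification to fileLocation (a local path or a gs:// path); used
+  // for --dataflowJobFile output and for creating job templates.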
+ private static void printWorkSpecJsonToFile(String fileLocation, Job job) throws IOException {
+ String workSpecJson = DataflowPipelineTranslator.jobToString(job);
+ ResourceId fileResource = FileSystems.matchNewResource(fileLocation, false /* isDirectory */);
+ try (OutputStreamWriter writer
+ = new OutputStreamWriter(
+ Channels.newOutputStream(FileSystems.create(fileResource, MimeTypes.TEXT)), UTF_8)) {
+ // Not using PrintWriter as it swallows IOException.
+ // Not using BufferedWriter as this invokes write() only once.
+ writer.write(workSpecJson);
+ }
+ }
+
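+  // Extracts the Docker container image and capabilities for a single environment id, failing
+  // if the environment is not Docker-based.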
+ private static EnvironmentInfo getEnvironmentInfoFromEnvironmentId(
+ String environmentId, RunnerApi.Pipeline pipelineProto) {
+ RunnerApi.Environment environment
+ = pipelineProto.getComponents().getEnvironmentsMap().get(environmentId);
+ if (!BeamUrns.getUrn(RunnerApi.StandardEnvironments.Environments.DOCKER)
+ .equals(environment.getUrn())) {
throw new RuntimeException(
- String.format("Error creating staged name for artifact %s", filePayload.getPath()),
- e);
- }
- }
- environmentBuilder.addDependencies(
- info.toBuilder()
- .setTypeUrn(BeamUrns.getUrn(RunnerApi.StandardArtifacts.Types.URL))
- .setTypePayload(
- RunnerApi.ArtifactUrlPayload.newBuilder()
- .setUrl(
- FileSystems.matchNewResource(options.getStagingLocation(), true)
- .resolve(
- stagedName, ResolveOptions.StandardResolveOptions.RESOLVE_FILE)
- .toString())
- .setSha256(filePayload.getSha256())
- .build()
- .toByteString()));
- }
- componentsBuilder.putEnvironments(entry.getKey(), environmentBuilder.build());
- }
- return pipelineBuilder.build();
- }
-
- protected List stageArtifacts(RunnerApi.Pipeline pipeline) {
- ImmutableList.Builder filesToStageBuilder = ImmutableList.builder();
- Set stagedNames = new HashSet<>();
- for (Map.Entry entry :
- pipeline.getComponents().getEnvironmentsMap().entrySet()) {
- for (RunnerApi.ArtifactInformation info : entry.getValue().getDependenciesList()) {
- if (!BeamUrns.getUrn(RunnerApi.StandardArtifacts.Types.FILE).equals(info.getTypeUrn())) {
- throw new RuntimeException(
- String.format("unsupported artifact type %s", info.getTypeUrn()));
- }
- RunnerApi.ArtifactFilePayload filePayload;
+ "Dataflow can only execute pipeline steps in Docker environments: "
+ + environment.getUrn());
+ }
+ RunnerApi.DockerPayload dockerPayload;
try {
- filePayload = RunnerApi.ArtifactFilePayload.parseFrom(info.getTypePayload());
+ dockerPayload = RunnerApi.DockerPayload.parseFrom(environment.getPayload());
} catch (InvalidProtocolBufferException e) {
- throw new RuntimeException("Error parsing artifact file payload.", e);
- }
- String stagedName;
- if (BeamUrns.getUrn(RunnerApi.StandardArtifacts.Roles.STAGING_TO)
- .equals(info.getRoleUrn())) {
- try {
- RunnerApi.ArtifactStagingToRolePayload stagingPayload =
- RunnerApi.ArtifactStagingToRolePayload.parseFrom(info.getRolePayload());
- stagedName = stagingPayload.getStagedName();
- } catch (InvalidProtocolBufferException e) {
- throw new RuntimeException("Error parsing artifact staging_to role payload.", e);
- }
- } else {
- try {
- File source = new File(filePayload.getPath());
- HashCode hashCode = Files.asByteSource(source).hash(Hashing.sha256());
- stagedName = Environments.createStagingFileName(source, hashCode);
- } catch (IOException e) {
- throw new RuntimeException(
- String.format("Error creating staged name for artifact %s", filePayload.getPath()),
- e);
- }
+ throw new RuntimeException("Error parsing docker payload.", e);
}
- if (stagedNames.contains(stagedName)) {
- continue;
- } else {
- stagedNames.add(stagedName);
- }
- filesToStageBuilder.add(
- StagedFile.of(filePayload.getPath(), filePayload.getSha256(), stagedName));
- }
- }
- return options.getStager().stageFiles(filesToStageBuilder.build());
- }
-
- private List getDefaultArtifacts() {
- ImmutableList.Builder pathsToStageBuilder = ImmutableList.builder();
- String windmillBinary =
- options.as(DataflowStreamingPipelineOptions.class).getOverrideWindmillBinary();
- String dataflowWorkerJar = options.getDataflowWorkerJar();
- if (dataflowWorkerJar != null && !dataflowWorkerJar.isEmpty() && !useUnifiedWorker(options)) {
- // Put the user specified worker jar at the start of the classpath, to be consistent with the
- // built in worker order.
- pathsToStageBuilder.add("dataflow-worker.jar=" + dataflowWorkerJar);
- }
- pathsToStageBuilder.addAll(options.getFilesToStage());
- if (windmillBinary != null) {
- pathsToStageBuilder.add("windmill_main=" + windmillBinary);
- }
- return Environments.getArtifacts(pathsToStageBuilder.build());
- }
-
- @VisibleForTesting
- static boolean isMultiLanguagePipeline(Pipeline pipeline) {
- class IsMultiLanguageVisitor extends PipelineVisitor.Defaults {
- private boolean isMultiLanguage = false;
-
- private void performMultiLanguageTest(Node node) {
- if (node.getTransform() instanceof External.ExpandableTransform) {
- isMultiLanguage = true;
- }
- }
-
- @Override
- public CompositeBehavior enterCompositeTransform(Node node) {
- performMultiLanguageTest(node);
- return super.enterCompositeTransform(node);
- }
-
- @Override
- public void visitPrimitiveTransform(Node node) {
- performMultiLanguageTest(node);
- super.visitPrimitiveTransform(node);
- }
- }
-
- IsMultiLanguageVisitor visitor = new IsMultiLanguageVisitor();
- pipeline.traverseTopologically(visitor);
-
- return visitor.isMultiLanguage;
- }
-
- private static boolean includesTransformUpgrades(Pipeline pipeline) {
- return (pipeline
- .getOptions()
- .as(ExternalTranslationOptions.class)
- .getTransformsToOverride()
- .size()
- > 0);
- }
-
- @Override
- public DataflowPipelineJob run(Pipeline pipeline) {
- // Multi-language pipelines and pipelines that include upgrades should automatically be upgraded
- // to Runner v2.
- if (DataflowRunner.isMultiLanguagePipeline(pipeline) || includesTransformUpgrades(pipeline)) {
-      List<String> experiments = firstNonNull(options.getExperiments(), Collections.emptyList());
- if (!experiments.contains("use_runner_v2")) {
- LOG.info(
- "Automatically enabling Dataflow Runner v2 since the pipeline used cross-language"
- + " transforms or pipeline needed a transform upgrade.");
- options.setExperiments(
- ImmutableList.builder().addAll(experiments).add("use_runner_v2").build());
- }
- }
- if (useUnifiedWorker(options)) {
- if (hasExperiment(options, "disable_runner_v2")
- || hasExperiment(options, "disable_runner_v2_until_2023")
- || hasExperiment(options, "disable_prime_runner_v2")) {
- throw new IllegalArgumentException(
- "Runner V2 both disabled and enabled: at least one of ['beam_fn_api', 'use_unified_worker', 'use_runner_v2', 'use_portable_job_submission'] is set and also one of ['disable_runner_v2', 'disable_runner_v2_until_2023', 'disable_prime_runner_v2'] is set.");
- }
-      List<String> experiments =
- new ArrayList<>(options.getExperiments()); // non-null if useUnifiedWorker is true
- if (!experiments.contains("use_runner_v2")) {
- experiments.add("use_runner_v2");
- }
- if (!experiments.contains("use_unified_worker")) {
- experiments.add("use_unified_worker");
- }
- if (!experiments.contains("beam_fn_api")) {
- experiments.add("beam_fn_api");
- }
- if (!experiments.contains("use_portable_job_submission")) {
- experiments.add("use_portable_job_submission");
- }
- options.setExperiments(ImmutableList.copyOf(experiments));
- // Ensure that logging via the FnApi is enabled
- options.as(SdkHarnessOptions.class).setEnableLogViaFnApi(true);
- }
-
- logWarningIfPCollectionViewHasNonDeterministicKeyCoder(pipeline);
- logWarningIfBigqueryDLQUnused(pipeline);
- if (shouldActAsStreaming(pipeline)) {
- options.setStreaming(true);
-
- if (useUnifiedWorker(options)) {
- options.setEnableStreamingEngine(true);
-        List<String> experiments =
- new ArrayList<>(options.getExperiments()); // non-null if useUnifiedWorker is true
- if (!experiments.contains("enable_streaming_engine")) {
- experiments.add("enable_streaming_engine");
- }
- if (!experiments.contains("enable_windmill_service")) {
- experiments.add("enable_windmill_service");
- }
- }
- }
-
- if (!ExperimentalOptions.hasExperiment(options, "disable_projection_pushdown")) {
- ProjectionPushdownOptimizer.optimize(pipeline);
- }
-
- LOG.info(
- "Executing pipeline on the Dataflow Service, which will have billing implications "
- + "related to Google Compute Engine usage and other Google Cloud Services.");
-
- DataflowPipelineOptions dataflowOptions = options.as(DataflowPipelineOptions.class);
- String workerHarnessContainerImageURL = DataflowRunner.getContainerImageForJob(dataflowOptions);
-
- // This incorrectly puns the worker harness container image (which implements v1beta3 API)
- // with the SDK harness image (which implements Fn API).
- //
- // The same Environment is used in different and contradictory ways, depending on whether
- // it is a v1 or v2 job submission.
- RunnerApi.Environment defaultEnvironmentForDataflow =
- Environments.createDockerEnvironment(workerHarnessContainerImageURL);
-
- // The SdkComponents for portable an non-portable job submission must be kept distinct. Both
- // need the default environment.
- SdkComponents portableComponents = SdkComponents.create();
- portableComponents.registerEnvironment(
- defaultEnvironmentForDataflow
- .toBuilder()
- .addAllDependencies(getDefaultArtifacts())
- .addAllCapabilities(Environments.getJavaCapabilities())
- .build());
-
- RunnerApi.Pipeline portablePipelineProto =
- PipelineTranslation.toProto(pipeline, portableComponents, false);
- // Note that `stageArtifacts` has to be called before `resolveArtifact` because
- // `resolveArtifact` updates local paths to staged paths in pipeline proto.
- portablePipelineProto = resolveAnyOfEnvironments(portablePipelineProto);
-    List<DataflowPackage> packages = stageArtifacts(portablePipelineProto);
- portablePipelineProto = resolveArtifacts(portablePipelineProto);
- portablePipelineProto = applySdkEnvironmentOverrides(portablePipelineProto, options);
- if (LOG.isDebugEnabled()) {
- LOG.debug(
- "Portable pipeline proto:\n{}",
- TextFormat.printer().printToString(portablePipelineProto));
- }
- // Stage the portable pipeline proto, retrieving the staged pipeline path, then update
- // the options on the new job
- // TODO: add an explicit `pipeline` parameter to the submission instead of pipeline options
- LOG.info("Staging portable pipeline proto to {}", options.getStagingLocation());
- byte[] serializedProtoPipeline = portablePipelineProto.toByteArray();
-
- DataflowPackage stagedPipeline =
- options.getStager().stageToFile(serializedProtoPipeline, PIPELINE_FILE_NAME);
- dataflowOptions.setPipelineUrl(stagedPipeline.getLocation());
-
- if (useUnifiedWorker(options)) {
- LOG.info("Skipping v1 transform replacements since job will run on v2.");
- } else {
- // Now rewrite things to be as needed for v1 (mutates the pipeline)
- // This way the job submitted is valid for v1 and v2, simultaneously
- replaceV1Transforms(pipeline);
- }
- // Capture the SdkComponents for look up during step translations
- SdkComponents dataflowV1Components = SdkComponents.create();
- dataflowV1Components.registerEnvironment(
- defaultEnvironmentForDataflow
- .toBuilder()
- .addAllDependencies(getDefaultArtifacts())
- .addAllCapabilities(Environments.getJavaCapabilities())
- .build());
- // No need to perform transform upgrading for the Runner v1 proto.
- RunnerApi.Pipeline dataflowV1PipelineProto =
- PipelineTranslation.toProto(pipeline, dataflowV1Components, true, false);
-
- if (LOG.isDebugEnabled()) {
- LOG.debug(
- "Dataflow v1 pipeline proto:\n{}",
- TextFormat.printer().printToString(dataflowV1PipelineProto));
- }
-
- // Set a unique client_request_id in the CreateJob request.
- // This is used to ensure idempotence of job creation across retried
- // attempts to create a job. Specifically, if the service returns a job with
- // a different client_request_id, it means the returned one is a different
- // job previously created with the same job name, and that the job creation
- // has been effectively rejected. The SDK should return
- // Error::Already_Exists to user in that case.
- int randomNum = new Random().nextInt(9000) + 1000;
- String requestId =
- DateTimeFormat.forPattern("YYYYMMddHHmmssmmm")
- .withZone(DateTimeZone.UTC)
- .print(DateTimeUtils.currentTimeMillis())
- + "_"
- + randomNum;
-
- JobSpecification jobSpecification =
- translator.translate(
- pipeline, dataflowV1PipelineProto, dataflowV1Components, this, packages);
-
- if (!isNullOrEmpty(dataflowOptions.getDataflowWorkerJar()) && !useUnifiedWorker(options)) {
-      List<String> experiments =
- firstNonNull(dataflowOptions.getExperiments(), Collections.emptyList());
- if (!experiments.contains("use_staged_dataflow_worker_jar")) {
- dataflowOptions.setExperiments(
- ImmutableList.builder()
- .addAll(experiments)
- .add("use_staged_dataflow_worker_jar")
- .build());
- }
- }
-
- Job newJob = jobSpecification.getJob();
- try {
- newJob
- .getEnvironment()
- .setSdkPipelineOptions(
- MAPPER.readValue(MAPPER_WITH_MODULES.writeValueAsBytes(options), Map.class));
- } catch (IOException e) {
- throw new IllegalArgumentException(
- "PipelineOptions specified failed to serialize to JSON.", e);
- }
- newJob.setClientRequestId(requestId);
-
- DataflowRunnerInfo dataflowRunnerInfo = DataflowRunnerInfo.getDataflowRunnerInfo();
- String version = dataflowRunnerInfo.getVersion();
- checkState(
- !"${pom.version}".equals(version),
- "Unable to submit a job to the Dataflow service with unset version ${pom.version}");
- LOG.info("Dataflow SDK version: {}", version);
-
- newJob.getEnvironment().setUserAgent((Map) dataflowRunnerInfo.getProperties());
- // The Dataflow Service may write to the temporary directory directly, so
- // must be verified.
- if (!isNullOrEmpty(options.getGcpTempLocation())) {
- newJob
- .getEnvironment()
- .setTempStoragePrefix(
- dataflowOptions.getPathValidator().verifyPath(options.getGcpTempLocation()));
- }
- newJob.getEnvironment().setDataset(options.getTempDatasetId());
-
- if (options.getWorkerRegion() != null) {
- newJob.getEnvironment().setWorkerRegion(options.getWorkerRegion());
- }
- if (options.getWorkerZone() != null) {
- newJob.getEnvironment().setWorkerZone(options.getWorkerZone());
- }
-
- if (options.getFlexRSGoal()
- == DataflowPipelineOptions.FlexResourceSchedulingGoal.COST_OPTIMIZED) {
- newJob.getEnvironment().setFlexResourceSchedulingGoal("FLEXRS_COST_OPTIMIZED");
- } else if (options.getFlexRSGoal()
- == DataflowPipelineOptions.FlexResourceSchedulingGoal.SPEED_OPTIMIZED) {
- newJob.getEnvironment().setFlexResourceSchedulingGoal("FLEXRS_SPEED_OPTIMIZED");
- }
-
- // Represent the minCpuPlatform pipeline option as an experiment, if not already present.
- if (!isNullOrEmpty(dataflowOptions.getMinCpuPlatform())) {
-      List<String> experiments =
- firstNonNull(dataflowOptions.getExperiments(), Collections.emptyList());
-
-      List<String> minCpuFlags =
- experiments.stream()
- .filter(p -> p.startsWith("min_cpu_platform"))
- .collect(Collectors.toList());
-
- if (minCpuFlags.isEmpty()) {
- dataflowOptions.setExperiments(
- ImmutableList.builder()
- .addAll(experiments)
- .add("min_cpu_platform=" + dataflowOptions.getMinCpuPlatform())
- .build());
- } else {
- LOG.warn(
- "Flag min_cpu_platform is defined in both top level PipelineOption, "
- + "as well as under experiments. Proceed using {}.",
- minCpuFlags.get(0));
- }
- }
-
- newJob
- .getEnvironment()
- .setExperiments(
- ImmutableList.copyOf(
- firstNonNull(dataflowOptions.getExperiments(), Collections.emptyList())));
-
- // Set the Docker container image that executes Dataflow worker harness, residing in Google
- // Container Registry. Translator is guaranteed to create a worker pool prior to this point.
- // For runner_v1, only worker_harness_container is set.
- // For runner_v2, both worker_harness_container and sdk_harness_container are set to the same
- // value.
- String containerImage = getContainerImageForJob(options);
- for (WorkerPool workerPool : newJob.getEnvironment().getWorkerPools()) {
- workerPool.setWorkerHarnessContainerImage(containerImage);
- }
-
- configureSdkHarnessContainerImages(options, portablePipelineProto, newJob);
-
- newJob.getEnvironment().setVersion(getEnvironmentVersion(options));
-
- if (hooks != null) {
- hooks.modifyEnvironmentBeforeSubmission(newJob.getEnvironment());
- }
-
- // enable upload_graph when the graph is too large
- byte[] jobGraphBytes = DataflowPipelineTranslator.jobToString(newJob).getBytes(UTF_8);
- int jobGraphByteSize = jobGraphBytes.length;
- if (jobGraphByteSize >= CREATE_JOB_REQUEST_LIMIT_BYTES
- && !hasExperiment(options, "upload_graph")
- && !useUnifiedWorker(options)) {
-      List<String> experiments = firstNonNull(options.getExperiments(), Collections.emptyList());
- options.setExperiments(
- ImmutableList.builder().addAll(experiments).add("upload_graph").build());
- LOG.info(
- "The job graph size ({} in bytes) is larger than {}. Automatically add "
- + "the upload_graph option to experiments.",
- jobGraphByteSize,
- CREATE_JOB_REQUEST_LIMIT_BYTES);
- }
-
- if (hasExperiment(options, "upload_graph") && useUnifiedWorker(options)) {
-      ArrayList<String> experiments = new ArrayList<>(options.getExperiments());
- while (experiments.remove("upload_graph")) {}
- options.setExperiments(experiments);
- LOG.warn(
- "The upload_graph experiment was specified, but it does not apply "
- + "to runner v2 jobs. Option has been automatically removed.");
- }
-
- // Upload the job to GCS and remove the graph object from the API call. The graph
- // will be downloaded from GCS by the service.
- if (hasExperiment(options, "upload_graph")) {
- DataflowPackage stagedGraph =
- options.getStager().stageToFile(jobGraphBytes, DATAFLOW_GRAPH_FILE_NAME);
- newJob.getSteps().clear();
- newJob.setStepsLocation(stagedGraph.getLocation());
- }
-
- if (!isNullOrEmpty(options.getDataflowJobFile())
- || !isNullOrEmpty(options.getTemplateLocation())) {
- boolean isTemplate = !isNullOrEmpty(options.getTemplateLocation());
- if (isTemplate) {
- checkArgument(
- isNullOrEmpty(options.getDataflowJobFile()),
- "--dataflowJobFile and --templateLocation are mutually exclusive.");
- }
- String fileLocation =
- firstNonNull(options.getTemplateLocation(), options.getDataflowJobFile());
- checkArgument(
- fileLocation.startsWith("/") || fileLocation.startsWith("gs://"),
- "Location must be local or on Cloud Storage, got %s.",
- fileLocation);
-
- try {
- printWorkSpecJsonToFile(fileLocation, newJob);
- LOG.info("Printed job specification to {}", fileLocation);
- } catch (IOException ex) {
- String error = String.format("Cannot create output file at %s", fileLocation);
- if (isTemplate) {
- throw new RuntimeException(error, ex);
+ return EnvironmentInfo.create(
+ environmentId, dockerPayload.getContainerImage(), environment.getCapabilitiesList());
+ }
+
+ @AutoValue
+ abstract static class EnvironmentInfo {
+
+ static EnvironmentInfo create(
+        String environmentId, String containerUrl, List<String> capabilities) {
+ return new AutoValue_DataflowRunner_EnvironmentInfo(
+ environmentId, containerUrl, capabilities);
+ }
+
+ abstract String environmentId();
+
+ abstract String containerUrl();
+
+    abstract List<String> capabilities();
+ }
+
+  private static List<EnvironmentInfo> getAllEnvironmentInfo(RunnerApi.Pipeline pipelineProto) {
+ return pipelineProto.getComponents().getTransformsMap().values().stream()
+ .map(transform -> transform.getEnvironmentId())
+ .filter(environmentId -> !environmentId.isEmpty())
+ .distinct()
+ .map(environmentId -> getEnvironmentInfoFromEnvironmentId(environmentId, pipelineProto))
+ .collect(Collectors.toList());
+ }
+
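+  // Populates the per-environment SDK harness container images on every worker pool of the
+  // job, marking environments without multi-core bundle processing support as single-core.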
+ static void configureSdkHarnessContainerImages(
+ DataflowPipelineOptions options, RunnerApi.Pipeline pipelineProto, Job newJob) {
+    List<SdkHarnessContainerImage> sdkContainerList
+ = getAllEnvironmentInfo(pipelineProto).stream()
+ .map(
+ environmentInfo -> {
+ SdkHarnessContainerImage image = new SdkHarnessContainerImage();
+ image.setEnvironmentId(environmentInfo.environmentId());
+ image.setContainerImage(environmentInfo.containerUrl());
+ if (!environmentInfo
+ .capabilities()
+ .contains(
+ BeamUrns.getUrn(
+ RunnerApi.StandardProtocols.Enum.MULTI_CORE_BUNDLE_PROCESSING))) {
+ image.setUseSingleCorePerContainer(true);
+ }
+ image.setCapabilities(environmentInfo.capabilities());
+ return image;
+ })
+ .collect(Collectors.toList());
+ for (WorkerPool workerPool : newJob.getEnvironment().getWorkerPools()) {
+ workerPool.setSdkHarnessContainerImages(sdkContainerList);
+ }
+ }
+
+ /**
+ * Returns true if the specified experiment is enabled, handling null
+ * experiments.
+ */
+ public static boolean hasExperiment(DataflowPipelineDebugOptions options, String experiment) {
+    List<String> experiments
+ = firstNonNull(options.getExperiments(), Collections.emptyList());
+ return experiments.contains(experiment);
+ }
+
+ /**
+ * Helper to configure the Dataflow Job Environment based on the user's job
+ * options.
+ */
+  private static Map<String, Object> getEnvironmentVersion(DataflowPipelineOptions options) {
+ DataflowRunnerInfo runnerInfo = DataflowRunnerInfo.getDataflowRunnerInfo();
+ String majorVersion;
+ String jobType;
+ if (useUnifiedWorker(options)) {
+ majorVersion = runnerInfo.getFnApiEnvironmentMajorVersion();
+ jobType = options.isStreaming() ? "FNAPI_STREAMING" : "FNAPI_BATCH";
} else {
- LOG.warn(error, ex);
- }
- }
-
- if (isTemplate) {
- LOG.info("Template successfully created.");
- return new DataflowTemplateJob();
- }
- }
-
- String jobIdToUpdate = null;
- if (options.isUpdate()) {
- jobIdToUpdate = getJobIdFromName(options.getJobName());
- newJob.setTransformNameMapping(options.getTransformNameMapping());
- newJob.setReplaceJobId(jobIdToUpdate);
- }
- if (options.getCreateFromSnapshot() != null && !options.getCreateFromSnapshot().isEmpty()) {
- newJob.setTransformNameMapping(options.getTransformNameMapping());
- newJob.setCreatedFromSnapshotId(options.getCreateFromSnapshot());
- }
-
- Job jobResult;
- try {
- jobResult = dataflowClient.createJob(newJob);
- } catch (GoogleJsonResponseException e) {
- String errorMessages = "Unexpected errors";
- if (e.getDetails() != null) {
- if (jobGraphByteSize >= CREATE_JOB_REQUEST_LIMIT_BYTES) {
- errorMessages =
- "The size of the serialized JSON representation of the pipeline "
- + "exceeds the allowable limit. "
- + "For more information, please see the documentation on job submission:\n"
- + "https://cloud.google.com/dataflow/docs/guides/deploying-a-pipeline#jobs";
+ majorVersion = runnerInfo.getLegacyEnvironmentMajorVersion();
+ jobType = options.isStreaming() ? "STREAMING" : "JAVA_BATCH_AUTOSCALING";
+ }
+ return ImmutableMap.of(
+ PropertyNames.ENVIRONMENT_VERSION_MAJOR_KEY, majorVersion,
+ PropertyNames.ENVIRONMENT_VERSION_JOB_TYPE_KEY, jobType);
+ }
+
+ // This method is protected to allow a Google internal subclass to properly
+ // setup overrides.
+ @VisibleForTesting
+ protected void replaceV1Transforms(Pipeline pipeline) {
+ boolean streaming = shouldActAsStreaming(pipeline);
+ // Ensure all outputs of all reads are consumed before potentially replacing any
+ // Read PTransforms
+ UnconsumedReads.ensureAllReadsConsumed(pipeline);
+ pipeline.replaceAll(getOverrides(streaming));
+ }
+
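+  // Decides whether the job should execute in streaming mode, based on the presence of
+  // unbounded PCollections in the pipeline and the value of the --streaming option.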
+ private boolean shouldActAsStreaming(Pipeline p) {
+ class BoundednessVisitor extends PipelineVisitor.Defaults {
+
+      final List<PCollection> unboundedPCollections = new ArrayList<>();
+
+ @Override
+ public void visitValue(PValue value, Node producer) {
+ if (value instanceof PCollection) {
+ PCollection pc = (PCollection) value;
+ if (pc.isBounded() == IsBounded.UNBOUNDED) {
+ unboundedPCollections.add(pc);
+ }
+ }
+ }
+ }
+
+ BoundednessVisitor visitor = new BoundednessVisitor();
+ p.traverseTopologically(visitor);
+ if (visitor.unboundedPCollections.isEmpty()) {
+ if (options.isStreaming()) {
+ LOG.warn(
+ "No unbounded PCollection(s) found in a streaming pipeline! "
+ + "You might consider using 'streaming=false'!");
+ return true;
+ } else {
+ return false;
+ }
} else {
- errorMessages = e.getDetails().getMessage();
- }
- }
- throw new RuntimeException("Failed to create a workflow job: " + errorMessages, e);
- } catch (IOException e) {
- throw new RuntimeException("Failed to create a workflow job", e);
- }
-
- // Use a raw client for post-launch monitoring, as status calls may fail
- // regularly and need not be retried automatically.
- DataflowPipelineJob dataflowPipelineJob =
- new DataflowPipelineJob(
- DataflowClient.create(options),
- jobResult.getId(),
- options,
- jobSpecification != null ? jobSpecification.getStepNames() : Collections.emptyMap(),
- portablePipelineProto);
-
- // If the service returned client request id, the SDK needs to compare it
- // with the original id generated in the request, if they are not the same
- // (i.e., the returned job is not created by this request), throw
- // DataflowJobAlreadyExistsException or DataflowJobAlreadyUpdatedException
- // depending on whether this is a reload or not.
- if (jobResult.getClientRequestId() != null
- && !jobResult.getClientRequestId().isEmpty()
- && !jobResult.getClientRequestId().equals(requestId)) {
- // If updating a job.
- if (options.isUpdate()) {
- throw new DataflowJobAlreadyUpdatedException(
- dataflowPipelineJob,
- String.format(
- "The job named %s with id: %s has already been updated into job id: %s "
- + "and cannot be updated again.",
- newJob.getName(), jobIdToUpdate, jobResult.getId()));
- } else {
- throw new DataflowJobAlreadyExistsException(
- dataflowPipelineJob,
- String.format(
- "There is already an active job named %s with id: %s. If you want to submit a"
- + " second job, try again by setting a different name using --jobName.",
- newJob.getName(), jobResult.getId()));
- }
- }
-
- LOG.info(
- "To access the Dataflow monitoring console, please navigate to {}",
- MonitoringUtil.getJobMonitoringPageURL(
- options.getProject(), options.getRegion(), jobResult.getId()));
- LOG.info("Submitted job: {}", jobResult.getId());
-
- LOG.info(
- "To cancel the job using the 'gcloud' tool, run:\n> {}",
- MonitoringUtil.getGcloudCancelCommand(options, jobResult.getId()));
-
- return dataflowPipelineJob;
- }
-
- private static void printWorkSpecJsonToFile(String fileLocation, Job job) throws IOException {
- String workSpecJson = DataflowPipelineTranslator.jobToString(job);
- ResourceId fileResource = FileSystems.matchNewResource(fileLocation, false /* isDirectory */);
- try (OutputStreamWriter writer =
- new OutputStreamWriter(
- Channels.newOutputStream(FileSystems.create(fileResource, MimeTypes.TEXT)), UTF_8)) {
- // Not using PrintWriter as it swallows IOException.
- // Not using BufferedWriter as this invokes write() only once.
- writer.write(workSpecJson);
- }
- }
-
- private static EnvironmentInfo getEnvironmentInfoFromEnvironmentId(
- String environmentId, RunnerApi.Pipeline pipelineProto) {
- RunnerApi.Environment environment =
- pipelineProto.getComponents().getEnvironmentsMap().get(environmentId);
- if (!BeamUrns.getUrn(RunnerApi.StandardEnvironments.Environments.DOCKER)
- .equals(environment.getUrn())) {
- throw new RuntimeException(
- "Dataflow can only execute pipeline steps in Docker environments: "
- + environment.getUrn());
- }
- RunnerApi.DockerPayload dockerPayload;
- try {
- dockerPayload = RunnerApi.DockerPayload.parseFrom(environment.getPayload());
- } catch (InvalidProtocolBufferException e) {
- throw new RuntimeException("Error parsing docker payload.", e);
- }
- return EnvironmentInfo.create(
- environmentId, dockerPayload.getContainerImage(), environment.getCapabilitiesList());
- }
-
- @AutoValue
- abstract static class EnvironmentInfo {
- static EnvironmentInfo create(
- String environmentId, String containerUrl, List capabilities) {
- return new AutoValue_DataflowRunner_EnvironmentInfo(
- environmentId, containerUrl, capabilities);
- }
-
- abstract String environmentId();
-
- abstract String containerUrl();
-
- abstract List capabilities();
- }
-
- private static List getAllEnvironmentInfo(RunnerApi.Pipeline pipelineProto) {
- return pipelineProto.getComponents().getTransformsMap().values().stream()
- .map(transform -> transform.getEnvironmentId())
- .filter(environmentId -> !environmentId.isEmpty())
- .distinct()
- .map(environmentId -> getEnvironmentInfoFromEnvironmentId(environmentId, pipelineProto))
- .collect(Collectors.toList());
- }
-
- static void configureSdkHarnessContainerImages(
- DataflowPipelineOptions options, RunnerApi.Pipeline pipelineProto, Job newJob) {
- List sdkContainerList =
- getAllEnvironmentInfo(pipelineProto).stream()
- .map(
- environmentInfo -> {
- SdkHarnessContainerImage image = new SdkHarnessContainerImage();
- image.setEnvironmentId(environmentInfo.environmentId());
- image.setContainerImage(environmentInfo.containerUrl());
- if (!environmentInfo
- .capabilities()
- .contains(
- BeamUrns.getUrn(
- RunnerApi.StandardProtocols.Enum.MULTI_CORE_BUNDLE_PROCESSING))) {
- image.setUseSingleCorePerContainer(true);
- }
- image.setCapabilities(environmentInfo.capabilities());
- return image;
- })
- .collect(Collectors.toList());
- for (WorkerPool workerPool : newJob.getEnvironment().getWorkerPools()) {
- workerPool.setSdkHarnessContainerImages(sdkContainerList);
- }
- }
-
- /** Returns true if the specified experiment is enabled, handling null experiments. */
- public static boolean hasExperiment(DataflowPipelineDebugOptions options, String experiment) {
- List experiments =
- firstNonNull(options.getExperiments(), Collections.emptyList());
- return experiments.contains(experiment);
- }
-
- /** Helper to configure the Dataflow Job Environment based on the user's job options. */
- private static Map getEnvironmentVersion(DataflowPipelineOptions options) {
- DataflowRunnerInfo runnerInfo = DataflowRunnerInfo.getDataflowRunnerInfo();
- String majorVersion;
- String jobType;
- if (useUnifiedWorker(options)) {
- majorVersion = runnerInfo.getFnApiEnvironmentMajorVersion();
- jobType = options.isStreaming() ? "FNAPI_STREAMING" : "FNAPI_BATCH";
- } else {
- majorVersion = runnerInfo.getLegacyEnvironmentMajorVersion();
- jobType = options.isStreaming() ? "STREAMING" : "JAVA_BATCH_AUTOSCALING";
- }
- return ImmutableMap.of(
- PropertyNames.ENVIRONMENT_VERSION_MAJOR_KEY, majorVersion,
- PropertyNames.ENVIRONMENT_VERSION_JOB_TYPE_KEY, jobType);
- }
-
- // This method is protected to allow a Google internal subclass to properly
- // setup overrides.
- @VisibleForTesting
- protected void replaceV1Transforms(Pipeline pipeline) {
- boolean streaming = shouldActAsStreaming(pipeline);
- // Ensure all outputs of all reads are consumed before potentially replacing any
- // Read PTransforms
- UnconsumedReads.ensureAllReadsConsumed(pipeline);
- pipeline.replaceAll(getOverrides(streaming));
- }
-
- private boolean shouldActAsStreaming(Pipeline p) {
- class BoundednessVisitor extends PipelineVisitor.Defaults {
-
- final List unboundedPCollections = new ArrayList<>();
-
- @Override
- public void visitValue(PValue value, Node producer) {
- if (value instanceof PCollection) {
- PCollection pc = (PCollection) value;
- if (pc.isBounded() == IsBounded.UNBOUNDED) {
- unboundedPCollections.add(pc);
- }
- }
- }
- }
-
- BoundednessVisitor visitor = new BoundednessVisitor();
- p.traverseTopologically(visitor);
- if (visitor.unboundedPCollections.isEmpty()) {
- if (options.isStreaming()) {
- LOG.warn(
- "No unbounded PCollection(s) found in a streaming pipeline! "
- + "You might consider using 'streaming=false'!");
- return true;
- } else {
- return false;
- }
- } else {
- if (options.isStreaming()) {
- return true;
- } else if (hasExperiment(options, UNSAFELY_ATTEMPT_TO_PROCESS_UNBOUNDED_DATA_IN_BATCH_MODE)) {
- LOG.info(
- "Turning a batch pipeline into streaming due to unbounded PCollection(s) has been avoided! "
- + "Unbounded PCollection(s): {}",
- visitor.unboundedPCollections);
- return false;
- } else {
- LOG.warn(
- "Unbounded PCollection(s) found in a batch pipeline! "
- + "You might consider using 'streaming=true'! "
- + "Unbounded PCollection(s): {}",
- visitor.unboundedPCollections);
- return true;
- }
- }
- };
+ if (options.isStreaming()) {
+ return true;
+ } else if (hasExperiment(options, UNSAFELY_ATTEMPT_TO_PROCESS_UNBOUNDED_DATA_IN_BATCH_MODE)) {
+ LOG.info(
+ "Turning a batch pipeline into streaming due to unbounded PCollection(s) has been avoided! "
+ + "Unbounded PCollection(s): {}",
+ visitor.unboundedPCollections);
+ return false;
+ } else {
+ LOG.warn(
+ "Unbounded PCollection(s) found in a batch pipeline! "
+ + "You might consider using 'streaming=true'! "
+ + "Unbounded PCollection(s): {}",
+ visitor.unboundedPCollections);
+ return true;
+ }
+ }
+ }
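+
+ // Illustrative only: a caller who deliberately wants to process an unbounded read in
+ // batch mode opts in through the experiment checked above, e.g. (hypothetical
+ // invocation; the flag value is the constant defined on this class):
+ //
+ //   DataflowPipelineOptions opts =
+ //       PipelineOptionsFactory.fromArgs(
+ //               "--runner=DataflowRunner",
+ //               "--experiments=unsafely_attempt_to_process_unbounded_data_in_batch_mode")
+ //           .as(DataflowPipelineOptions.class);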
+
/** Returns the DataflowPipelineTranslator associated with this object. */
public DataflowPipelineTranslator getTranslator() {
- return translator;
- }
+ return translator;
+ }
- /** Sets callbacks to invoke during execution see {@code DataflowRunnerHooks}. */
- public void setHooks(DataflowRunnerHooks hooks) {
- this.hooks = hooks;
- }
+ /**
+ * Sets callbacks to invoke during execution; see
+ * {@code DataflowRunnerHooks}.
+ */
+ public void setHooks(DataflowRunnerHooks hooks) {
+ this.hooks = hooks;
+ }
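+
+ // A minimal usage sketch (the anonymous hook body is hypothetical): hooks are installed
+ // on the runner instance before run(), e.g.
+ //
+ //   DataflowRunner runner = DataflowRunner.fromOptions(options);
+ //   runner.setHooks(new DataflowRunnerHooks() { /* override hook methods as needed */ });
+ //   runner.run(pipeline);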
- /////////////////////////////////////////////////////////////////////////////
+ /////////////////////////////////////////////////////////////////////////////
private void logWarningIfBigqueryDLQUnused(Pipeline pipeline) {
- Map, String> unconsumedDLQ = Maps.newHashMap();
- pipeline.traverseTopologically(
- new PipelineVisitor.Defaults() {
- @Override
- public CompositeBehavior enterCompositeTransform(Node node) {
- PTransform, ?> transform = node.getTransform();
- if (transform != null) {
- TupleTag> failedTag = null;
- String rootBigQueryTransform = "";
- if (transform.getClass().equals(StorageApiLoads.class)) {
- StorageApiLoads, ?> storageLoads = (StorageApiLoads, ?>) transform;
- // If the storage load is directing exceptions to an error handler, we don't need to
- // warn for unconsumed rows
- if (!storageLoads.usesErrorHandler()) {
- failedTag = storageLoads.getFailedRowsTag();
- }
- // For storage API the transform that outputs failed rows is nested one layer below
- // BigQueryIO.
- rootBigQueryTransform = node.getEnclosingNode().getFullName();
- } else if (transform.getClass().equals(StreamingWriteTables.class)) {
- StreamingWriteTables> streamingInserts = (StreamingWriteTables>) transform;
- failedTag = streamingInserts.getFailedRowsTupleTag();
- // For streaming inserts the transform that outputs failed rows is nested two layers
- // below BigQueryIO.
- rootBigQueryTransform = node.getEnclosingNode().getEnclosingNode().getFullName();
- }
- if (failedTag != null) {
- PCollection> dlq = node.getOutputs().get(failedTag);
- if (dlq != null) {
- unconsumedDLQ.put(dlq, rootBigQueryTransform);
+ Map<PCollection<?>, String> unconsumedDLQ = Maps.newHashMap();
+ pipeline.traverseTopologically(
+ new PipelineVisitor.Defaults() {
+ @Override
+ public CompositeBehavior enterCompositeTransform(Node node) {
+ PTransform<?, ?> transform = node.getTransform();
+ if (transform != null) {
+ TupleTag<?> failedTag = null;
+ String rootBigQueryTransform = "";
+ if (transform.getClass().equals(StorageApiLoads.class)) {
+ StorageApiLoads<?, ?> storageLoads = (StorageApiLoads<?, ?>) transform;
+ // If the storage load is directing exceptions to an error handler, we don't need to
+ // warn for unconsumed rows
+ if (!storageLoads.usesErrorHandler()) {
+ failedTag = storageLoads.getFailedRowsTag();
+ }
+ // For storage API the transform that outputs failed rows is nested one layer below
+ // BigQueryIO.
+ rootBigQueryTransform = node.getEnclosingNode().getFullName();
+ } else if (transform.getClass().equals(StreamingWriteTables.class)) {
+ StreamingWriteTables<?> streamingInserts = (StreamingWriteTables<?>) transform;
+ failedTag = streamingInserts.getFailedRowsTupleTag();
+ // For streaming inserts the transform that outputs failed rows is nested two layers
+ // below BigQueryIO.
+ rootBigQueryTransform = node.getEnclosingNode().getEnclosingNode().getFullName();
+ }
+ if (failedTag != null) {
+ PCollection<?> dlq = node.getOutputs().get(failedTag);
+ if (dlq != null) {
+ unconsumedDLQ.put(dlq, rootBigQueryTransform);
+ }
+ }
}
- }
- }
- for (PCollection> input : node.getInputs().values()) {
- unconsumedDLQ.remove(input);
+ for (PCollection<?> input : node.getInputs().values()) {
+ unconsumedDLQ.remove(input);
+ }
+ return CompositeBehavior.ENTER_TRANSFORM;
}
- return CompositeBehavior.ENTER_TRANSFORM;
- }
- @Override
- public void visitPrimitiveTransform(Node node) {
- for (PCollection> input : node.getInputs().values()) {
- unconsumedDLQ.remove(input);
+ @Override
+ public void visitPrimitiveTransform(Node node) {
+ for (PCollection<?> input : node.getInputs().values()) {
+ unconsumedDLQ.remove(input);
+ }
}
- }
});
- for (String unconsumed : unconsumedDLQ.values()) {
- LOG.warn(
- "No transform processes the failed-inserts output from BigQuery sink: "
- + unconsumed
- + "! Not processing failed inserts means that those rows will be lost.");
- }
- }
-
- /** Outputs a warning about PCollection views without deterministic key coders. */
- private void logWarningIfPCollectionViewHasNonDeterministicKeyCoder(Pipeline pipeline) {
- // We need to wait till this point to determine the names of the transforms since only
- // at this time do we know the hierarchy of the transforms otherwise we could
- // have just recorded the full names during apply time.
- if (!ptransformViewsWithNonDeterministicKeyCoders.isEmpty()) {
- final SortedSet ptransformViewNamesWithNonDeterministicKeyCoders = new TreeSet<>();
- pipeline.traverseTopologically(
- new PipelineVisitor.Defaults() {
- @Override
- public void visitValue(PValue value, TransformHierarchy.Node producer) {}
+ for (String unconsumed : unconsumedDLQ.values()) {
+ LOG.warn(
+ "No transform processes the failed-inserts output from BigQuery sink: "
+ + unconsumed
+ + "! Not processing failed inserts means that those rows will be lost.");
+ }
+ }
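+
+ // Illustrative sketch of avoiding the warning above by consuming the failed-inserts
+ // output (transform names and the handling DoFn are hypothetical; for the Storage
+ // Write API path the corresponding failed-rows getter would be used instead):
+ //
+ //   WriteResult result = rows.apply("WriteToBQ", BigQueryIO.writeTableRows().to(table));
+ //   result.getFailedInsertsWithErr()
+ //       .apply("HandleFailedRows", ParDo.of(new LogFailedRowsFn()));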
- @Override
- public void visitPrimitiveTransform(TransformHierarchy.Node node) {
- if (ptransformViewsWithNonDeterministicKeyCoders.contains(node.getTransform())) {
- ptransformViewNamesWithNonDeterministicKeyCoders.add(node.getFullName());
- }
- }
+ /**
+ * Outputs a warning about PCollection views without deterministic key
+ * coders.
+ */
+ private void logWarningIfPCollectionViewHasNonDeterministicKeyCoder(Pipeline pipeline) {
+ // We need to wait until this point to determine the names of the transforms, since only
+ // now do we know the transform hierarchy; otherwise we could have just recorded the
+ // full names at apply time.
+ if (!ptransformViewsWithNonDeterministicKeyCoders.isEmpty()) {
+ final SortedSet<String> ptransformViewNamesWithNonDeterministicKeyCoders = new TreeSet<>();
+ pipeline.traverseTopologically(
+ new PipelineVisitor.Defaults() {
+ @Override
+ public void visitValue(PValue value, TransformHierarchy.Node producer) {
+ }
- @Override
- public CompositeBehavior enterCompositeTransform(TransformHierarchy.Node node) {
- if (node.getTransform() instanceof View.AsMap
- || node.getTransform() instanceof View.AsMultimap) {
- PCollection> input =
- (PCollection>) Iterables.getOnlyElement(node.getInputs().values());
- KvCoder, ?> inputCoder = (KvCoder) input.getCoder();
- try {
- inputCoder.getKeyCoder().verifyDeterministic();
- } catch (NonDeterministicException e) {
- ptransformViewNamesWithNonDeterministicKeyCoders.add(node.getFullName());
+ @Override
+ public void visitPrimitiveTransform(TransformHierarchy.Node node) {
+ if (ptransformViewsWithNonDeterministicKeyCoders.contains(node.getTransform())) {
+ ptransformViewNamesWithNonDeterministicKeyCoders.add(node.getFullName());
+ }
}
- }
- if (ptransformViewsWithNonDeterministicKeyCoders.contains(node.getTransform())) {
- ptransformViewNamesWithNonDeterministicKeyCoders.add(node.getFullName());
- }
- return CompositeBehavior.ENTER_TRANSFORM;
- }
- @Override
- public void leaveCompositeTransform(TransformHierarchy.Node node) {}
- });
-
- LOG.warn(
- "Unable to use indexed implementation for View.AsMap and View.AsMultimap for {} because"
- + " the key coder is not deterministic. Falling back to singleton implementation"
- + " which may cause memory and/or performance problems. Future major versions of"
- + " Dataflow will require deterministic key coders.",
- ptransformViewNamesWithNonDeterministicKeyCoders);
- }
- }
-
- /**
- * Returns true if the passed in {@link PCollection} needs to be materialized using an indexed
- * format.
- */
- boolean doesPCollectionRequireIndexedFormat(PCollection> pcol) {
- return pcollectionsRequiringIndexedFormat.contains(pcol);
- }
-
- /**
- * Marks the passed in {@link PCollection} as requiring to be materialized using an indexed
- * format.
- */
- void addPCollectionRequiringIndexedFormat(PCollection> pcol) {
- pcollectionsRequiringIndexedFormat.add(pcol);
- }
-
- void maybeRecordPCollectionPreservedKeys(PCollection> pcol) {
- pCollectionsPreservedKeys.add(pcol);
- }
-
- void maybeRecordPCollectionWithAutoSharding(PCollection> pcol) {
- // Auto-sharding is only supported in Streaming Engine.
- checkArgument(
- options.isEnableStreamingEngine(),
- "Runner determined sharding not available in Dataflow for GroupIntoBatches for"
- + " non-Streaming-Engine jobs. In order to use runner determined sharding, please use"
- + " --streaming --experiments=enable_streaming_engine");
- pCollectionsPreservedKeys.add(pcol);
- pcollectionsRequiringAutoSharding.add(pcol);
- }
-
- boolean doesPCollectionPreserveKeys(PCollection> pcol) {
- return pCollectionsPreservedKeys.contains(pcol);
- }
-
- boolean doesPCollectionRequireAutoSharding(PCollection> pcol) {
- return pcollectionsRequiringAutoSharding.contains(pcol);
- }
-
- /** A set of {@link View}s with non-deterministic key coders. */
- private Set> ptransformViewsWithNonDeterministicKeyCoders;
-
- /** Records that the {@link PTransform} requires a deterministic key coder. */
- void recordViewUsesNonDeterministicKeyCoder(PTransform, ?> ptransform) {
- ptransformViewsWithNonDeterministicKeyCoders.add(ptransform);
- }
-
- // ================================================================================
- // PubsubIO translations
- // ================================================================================
-
- private static class StreamingPubsubIOReadOverrideFactory
- implements PTransformOverrideFactory<
- PBegin, PCollection, PubsubUnboundedSource> {
+ @Override
+ public CompositeBehavior enterCompositeTransform(TransformHierarchy.Node node) {
+ if (node.getTransform() instanceof View.AsMap
+ || node.getTransform() instanceof View.AsMultimap) {
+ PCollection<KV<?, ?>> input
+ = (PCollection<KV<?, ?>>) Iterables.getOnlyElement(node.getInputs().values());
+ KvCoder<?, ?> inputCoder = (KvCoder) input.getCoder();
+ try {
+ inputCoder.getKeyCoder().verifyDeterministic();
+ } catch (NonDeterministicException e) {
+ ptransformViewNamesWithNonDeterministicKeyCoders.add(node.getFullName());
+ }
+ }
+ if (ptransformViewsWithNonDeterministicKeyCoders.contains(node.getTransform())) {
+ ptransformViewNamesWithNonDeterministicKeyCoders.add(node.getFullName());
+ }
+ return CompositeBehavior.ENTER_TRANSFORM;
+ }
- @Override
- public PTransformReplacement> getReplacementTransform(
- AppliedPTransform, PubsubUnboundedSource> transform) {
- return PTransformReplacement.of(
- transform.getPipeline().begin(), new StreamingPubsubIORead(transform.getTransform()));
+ @Override
+ public void leaveCompositeTransform(TransformHierarchy.Node node) {
+ }
+ });
+
+ LOG.warn(
+ "Unable to use indexed implementation for View.AsMap and View.AsMultimap for {} because"
+ + " the key coder is not deterministic. Falling back to singleton implementation"
+ + " which may cause memory and/or performance problems. Future major versions of"
+ + " Dataflow will require deterministic key coders.",
+ ptransformViewNamesWithNonDeterministicKeyCoders);
+ }
}
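+
+ // For illustration (types are hypothetical): a View.asMap() keyed by an arbitrary POJO
+ // encoded with SerializableCoder cannot be verified deterministic and falls back to the
+ // singleton implementation, whereas StringUtf8Coder keys keep the indexed path:
+ //
+ //   PCollectionView<Map<String, Long>> view =
+ //       wordCounts.apply(View.<String, Long>asMap());  // deterministic String keys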
- @Override
- public Map, ReplacementOutput> mapOutputs(
- Map, PCollection>> outputs, PCollection newOutput) {
- return ReplacementOutputs.singleton(outputs, newOutput);
+ /**
+ * Returns true if the passed in {@link PCollection} needs to be
+ * materialized using an indexed format.
+ */
+ boolean doesPCollectionRequireIndexedFormat(PCollection<?> pcol) {
+ return pcollectionsRequiringIndexedFormat.contains(pcol);
}
- }
-
- /**
- * Suppress application of {@link PubsubUnboundedSource#expand} in streaming mode so that we can
- * instead defer to Windmill's implementation.
- */
- private static class StreamingPubsubIORead
- extends PTransform> {
- private final PubsubUnboundedSource transform;
+ /**
+ * Marks the passed in {@link PCollection} as requiring materialization
+ * using an indexed format.
+ */
+ void addPCollectionRequiringIndexedFormat(PCollection<?> pcol) {
+ pcollectionsRequiringIndexedFormat.add(pcol);
+ }
- public StreamingPubsubIORead(PubsubUnboundedSource transform) {
- this.transform = transform;
+ void maybeRecordPCollectionPreservedKeys(PCollection<?> pcol) {
+ pCollectionsPreservedKeys.add(pcol);
}
- public PubsubUnboundedSource getOverriddenTransform() {
- return transform;
+ void maybeRecordPCollectionWithAutoSharding(PCollection<?> pcol) {
+ // Auto-sharding is only supported in Streaming Engine.
+ checkArgument(
+ options.isEnableStreamingEngine(),
+ "Runner determined sharding not available in Dataflow for GroupIntoBatches for"
+ + " non-Streaming-Engine jobs. In order to use runner determined sharding, please use"
+ + " --streaming --experiments=enable_streaming_engine");
+ pCollectionsPreservedKeys.add(pcol);
+ pcollectionsRequiringAutoSharding.add(pcol);
}
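+
+ // A minimal sketch of the supported setup (element types are hypothetical): runner
+ // determined sharding of GroupIntoBatches requires Streaming Engine, e.g.
+ //
+ //   --streaming --experiments=enable_streaming_engine
+ //   ...
+ //   keyedInput.apply(GroupIntoBatches.<String, TableRow>ofSize(100).withShardedKey());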
- @Override
- public PCollection expand(PBegin input) {
- Coder coder =
- transform.getNeedsMessageId()
- ? new PubsubMessageWithAttributesAndMessageIdCoder()
- : new PubsubMessageWithAttributesCoder();
- return PCollection.createPrimitiveOutputInternal(
- input.getPipeline(), WindowingStrategy.globalDefault(), IsBounded.UNBOUNDED, coder);
+ boolean doesPCollectionPreserveKeys(PCollection<?> pcol) {
+ return pCollectionsPreservedKeys.contains(pcol);
}
- @Override
- protected String getKindString() {
- return "StreamingPubsubIORead";
+ boolean doesPCollectionRequireAutoSharding(PCollection<?> pcol) {
+ return pcollectionsRequiringAutoSharding.contains(pcol);
}
- static {
- DataflowPipelineTranslator.registerTransformTranslator(
- StreamingPubsubIORead.class, new StreamingPubsubIOReadTranslator());
- }
- }
-
- private static void translateOverriddenPubsubSourceStep(
- PubsubUnboundedSource overriddenTransform, StepTranslationContext stepTranslationContext) {
- stepTranslationContext.addInput(PropertyNames.FORMAT, "pubsub");
- if (overriddenTransform.getTopicProvider() != null) {
- if (overriddenTransform.getTopicProvider().isAccessible()) {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_TOPIC, overriddenTransform.getTopic().getFullPath());
- } else {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_TOPIC_OVERRIDE,
- ((NestedValueProvider) overriddenTransform.getTopicProvider()).propertyName());
- }
- }
- if (overriddenTransform.getSubscriptionProvider() != null) {
- if (overriddenTransform.getSubscriptionProvider().isAccessible()) {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_SUBSCRIPTION, overriddenTransform.getSubscription().getFullPath());
- } else {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_SUBSCRIPTION_OVERRIDE,
- ((NestedValueProvider) overriddenTransform.getSubscriptionProvider()).propertyName());
- }
- }
- if (overriddenTransform.getTimestampAttribute() != null) {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_TIMESTAMP_ATTRIBUTE, overriddenTransform.getTimestampAttribute());
- }
- if (overriddenTransform.getIdAttribute() != null) {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_ID_ATTRIBUTE, overriddenTransform.getIdAttribute());
- }
- // In both cases, the transform needs to read PubsubMessage. However, in case it needs
- // the attributes or messageId, we supply an identity "parse fn" so the worker will
- // read PubsubMessage's from Windmill and simply pass them around; and in case it
- // doesn't need attributes, we're already implicitly using a "Coder" that interprets
- // the data as a PubsubMessage's payload.
- if (overriddenTransform.getNeedsAttributes() || overriddenTransform.getNeedsMessageId()) {
- stepTranslationContext.addInput(
- PropertyNames.PUBSUB_SERIALIZED_ATTRIBUTES_FN,
- byteArrayToJsonString(serializeToByteArray(new IdentityMessageFn())));
- }
- }
-
- /** Rewrite {@link StreamingPubsubIORead} to the appropriate internal node. */
- private static class StreamingPubsubIOReadTranslator
- implements TransformTranslator {
+ /**
+ * A set of {@link View}s with non-deterministic key coders.
+ */
+ private Set<PTransform<?, ?>> ptransformViewsWithNonDeterministicKeyCoders;
- @Override
- public void translate(
- StreamingPubsubIORead transform, TransformTranslator.TranslationContext context) {
- checkArgument(
- context.getPipelineOptions().isStreaming(),
- "StreamingPubsubIORead is only for streaming pipelines.");
- StepTranslationContext stepContext = context.addStep(transform, "ParallelRead");
- translateOverriddenPubsubSourceStep(transform.getOverriddenTransform(), stepContext);
- stepContext.addOutput(PropertyNames.OUTPUT, context.getOutput(transform));
+ /**
+ * Records that the {@link PTransform} requires a deterministic key coder.
+ */
+ void recordViewUsesNonDeterministicKeyCoder(PTransform<?, ?> ptransform) {
+ ptransformViewsWithNonDeterministicKeyCoders.add(ptransform);
}
- }
- private static class IdentityMessageFn extends SimpleFunction {
+ // ================================================================================
+ // PubsubIO translations
+ // ================================================================================
+ private static class StreamingPubsubIOReadOverrideFactory
+ implements PTransformOverrideFactory<
+ PBegin, PCollection, PubsubUnboundedSource> {
- @Override
- public PubsubMessage apply(PubsubMessage input) {
- return input;
+ @Override
+ public PTransformReplacement<PBegin, PCollection<PubsubMessage>> getReplacementTransform(
+ AppliedPTransform<PBegin, PCollection<PubsubMessage>, PubsubUnboundedSource> transform) {
+ return PTransformReplacement.of(
+ transform.getPipeline().begin(), new StreamingPubsubIORead(transform.getTransform()));
+ }
+
+ @Override
+ public Map<PCollection<?>, ReplacementOutput> mapOutputs(
+ Map<TupleTag<?>, PCollection<?>> outputs, PCollection<PubsubMessage> newOutput) {
+ return ReplacementOutputs.singleton(outputs, newOutput);
+ }
}
- }
- /**
- * Suppress application of {@link PubsubUnboundedSink#expand} in streaming mode so that we can
- * instead defer to Windmill's implementation.
- */
- static class StreamingPubsubIOWrite extends PTransform, PDone> {
+ /**
+ * Suppress application of {@link PubsubUnboundedSource#expand} in streaming
+ * mode so that we can instead defer to Windmill's implementation.
+ */
+ private static class StreamingPubsubIORead
+ extends PTransform<PBegin, PCollection<PubsubMessage>> {
- private final PubsubUnboundedSink transform;
+ private final PubsubUnboundedSource transform;
- /** Builds an instance of this class from the overridden transform. */
- public StreamingPubsubIOWrite(DataflowRunner runner, PubsubUnboundedSink transform) {
- this.transform = transform;
- }
+ public StreamingPubsubIORead(PubsubUnboundedSource transform) {
+ this.transform = transform;
+ }
- PubsubUnboundedSink getOverriddenTransform() {
- return transform;
- }
+ public PubsubUnboundedSource getOverriddenTransform() {
+ return transform;
+ }
- @Override
- public PDone expand(PCollection input) {
- return PDone.in(input.getPipeline());
+ @Override
+ public PCollection expand(PBegin input) {
+ Coder<PubsubMessage> coder
+ = transform.getNeedsMessageId()
+ ? new PubsubMessageWithAttributesAndMessageIdCoder()
+ : new PubsubMessageWithAttributesCoder();
+ return PCollection.createPrimitiveOutputInternal(
+ input.getPipeline(), WindowingStrategy.globalDefault(), IsBounded.UNBOUNDED, coder);
+ }
+
+ @Override
+ protected String getKindString() {
+ return "StreamingPubsubIORead";
+ }
+
+ static {
+ DataflowPipelineTranslator.registerTransformTranslator(
+ StreamingPubsubIORead.class, new StreamingPubsubIOReadTranslator());
+ }
}
- @Override
- protected String getKindString() {
- return "StreamingPubsubIOWrite";
+ private static void translateOverriddenPubsubSourceStep(
+ PubsubUnboundedSource overriddenTransform, StepTranslationContext stepTranslationContext) {
+ stepTranslationContext.addInput(PropertyNames.FORMAT, "pubsub");
+ if (overriddenTransform.getTopicProvider() != null) {
+ if (overriddenTransform.getTopicProvider().isAccessible()) {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_TOPIC, overriddenTransform.getTopic().getFullPath());
+ } else {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_TOPIC_OVERRIDE,
+ ((NestedValueProvider) overriddenTransform.getTopicProvider()).propertyName());
+ }
+ }
+ if (overriddenTransform.getSubscriptionProvider() != null) {
+ if (overriddenTransform.getSubscriptionProvider().isAccessible()) {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_SUBSCRIPTION, overriddenTransform.getSubscription().getFullPath());
+ } else {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_SUBSCRIPTION_OVERRIDE,
+ ((NestedValueProvider) overriddenTransform.getSubscriptionProvider()).propertyName());
+ }
+ }
+ if (overriddenTransform.getTimestampAttribute() != null) {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_TIMESTAMP_ATTRIBUTE, overriddenTransform.getTimestampAttribute());
+ }
+ if (overriddenTransform.getIdAttribute() != null) {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_ID_ATTRIBUTE, overriddenTransform.getIdAttribute());
+ }
+ // In both cases, the transform needs to read PubsubMessage. However, in case it needs
+ // the attributes or messageId, we supply an identity "parse fn" so the worker will
+ // read PubsubMessages from Windmill and simply pass them around; and in case it
+ // doesn't need attributes, we're already implicitly using a "Coder" that interprets
+ // the data as a PubsubMessage's payload.
+ if (overriddenTransform.getNeedsAttributes() || overriddenTransform.getNeedsMessageId()) {
+ stepTranslationContext.addInput(
+ PropertyNames.PUBSUB_SERIALIZED_ATTRIBUTES_FN,
+ byteArrayToJsonString(serializeToByteArray(new IdentityMessageFn())));
+ }
}
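+
+ // For illustration: a subscription-based read with an id attribute would populate the
+ // step roughly as follows (values are hypothetical; keys are the PropertyNames used above):
+ //
+ //   FORMAT                          -> "pubsub"
+ //   PUBSUB_SUBSCRIPTION             -> "projects/my-project/subscriptions/my-sub"
+ //   PUBSUB_ID_ATTRIBUTE             -> "msgIdAttr"
+ //   PUBSUB_SERIALIZED_ATTRIBUTES_FN -> serialized IdentityMessageFn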
- static {
- DataflowPipelineTranslator.registerTransformTranslator(
- StreamingPubsubIOWrite.class,
- new StreamingPubsubSinkTranslators.StreamingPubsubIOWriteTranslator());
+ /**
+ * Rewrite {@link StreamingPubsubIORead} to the appropriate internal node.
+ */
+ private static class StreamingPubsubIOReadTranslator
+ implements TransformTranslator<StreamingPubsubIORead> {
+
+ @Override
+ public void translate(
+ StreamingPubsubIORead transform, TransformTranslator.TranslationContext context) {
+ checkArgument(
+ context.getPipelineOptions().isStreaming(),
+ "StreamingPubsubIORead is only for streaming pipelines.");
+ StepTranslationContext stepContext = context.addStep(transform, "ParallelRead");
+ translateOverriddenPubsubSourceStep(transform.getOverriddenTransform(), stepContext);
+ stepContext.addOutput(PropertyNames.OUTPUT, context.getOutput(transform));
+ }
}
- }
- private static class StreamingPubsubSinkTranslators {
- /** Rewrite {@link StreamingPubsubIOWrite} to the appropriate internal node. */
- static class StreamingPubsubIOWriteTranslator
- implements TransformTranslator {
+ private static class IdentityMessageFn extends SimpleFunction<PubsubMessage, PubsubMessage> {
- @Override
- public void translate(
- StreamingPubsubIOWrite transform, TransformTranslator.TranslationContext context) {
- checkArgument(
- context.getPipelineOptions().isStreaming(),
- "StreamingPubsubIOWrite is only for streaming pipelines.");
- StepTranslationContext stepContext = context.addStep(transform, "ParallelWrite");
- StreamingPubsubSinkTranslators.translate(
- transform.getOverriddenTransform(), stepContext, context.getInput(transform));
- }
- }
-
- private static void translate(
- PubsubUnboundedSink overriddenTransform,
- StepTranslationContext stepContext,
- PCollection input) {
- stepContext.addInput(PropertyNames.FORMAT, "pubsub");
- if (overriddenTransform.getTopicProvider() != null) {
- if (overriddenTransform.getTopicProvider().isAccessible()) {
- stepContext.addInput(
- PropertyNames.PUBSUB_TOPIC, overriddenTransform.getTopic().getFullPath());
- } else {
- stepContext.addInput(
- PropertyNames.PUBSUB_TOPIC_OVERRIDE,
- ((NestedValueProvider) overriddenTransform.getTopicProvider()).propertyName());
- }
- } else {
- stepContext.addInput(PropertyNames.PUBSUB_DYNAMIC_DESTINATIONS, true);
- }
- if (overriddenTransform.getTimestampAttribute() != null) {
- stepContext.addInput(
- PropertyNames.PUBSUB_TIMESTAMP_ATTRIBUTE, overriddenTransform.getTimestampAttribute());
- }
- if (overriddenTransform.getIdAttribute() != null) {
- stepContext.addInput(
- PropertyNames.PUBSUB_ID_ATTRIBUTE, overriddenTransform.getIdAttribute());
- }
- stepContext.addInput(
- PropertyNames.PUBSUB_SERIALIZED_ATTRIBUTES_FN,
- byteArrayToJsonString(serializeToByteArray(new IdentityMessageFn())));
-
- // Using a GlobalWindowCoder as a place holder because GlobalWindowCoder is known coder.
- stepContext.addEncodingInput(
- WindowedValue.getFullCoder(VoidCoder.of(), GlobalWindow.Coder.INSTANCE));
- stepContext.addInput(PropertyNames.PARALLEL_INPUT, input);
- }
- }
-
- // ================================================================================
-
- private static class SingleOutputExpandableTransformTranslator
- implements TransformTranslator {
- @Override
- public void translate(
- External.SingleOutputExpandableTransform transform, TranslationContext context) {
- StepTranslationContext stepContext = context.addStep(transform, "ExternalTransform");
- PCollection> output = (PCollection>) context.getOutput(transform);
- stepContext.addOutput(PropertyNames.OUTPUT, output);
- }
- }
-
- static {
- DataflowPipelineTranslator.registerTransformTranslator(
- External.SingleOutputExpandableTransform.class,
- new SingleOutputExpandableTransformTranslator());
- }
-
- private static class MultiOutputExpandableTransformTranslator
- implements TransformTranslator {
- @Override
- public void translate(
- External.MultiOutputExpandableTransform transform, TranslationContext context) {
- StepTranslationContext stepContext = context.addStep(transform, "ExternalTransform");
- Map, PCollection>> outputs = context.getOutputs(transform);
- for (Map.Entry, PCollection>> taggedOutput : outputs.entrySet()) {
- TupleTag> tag = taggedOutput.getKey();
- stepContext.addOutput(tag.getId(), taggedOutput.getValue());
- }
+ @Override
+ public PubsubMessage apply(PubsubMessage input) {
+ return input;
+ }
}
- }
- static {
- DataflowPipelineTranslator.registerTransformTranslator(
- External.MultiOutputExpandableTransform.class,
- new MultiOutputExpandableTransformTranslator());
- }
+ /**
+ * Suppress application of {@link PubsubUnboundedSink#expand} in streaming
+ * mode so that we can instead defer to Windmill's implementation.
+ */
+ static class StreamingPubsubIOWrite extends PTransform<PCollection<PubsubMessage>, PDone> {
- private static class ImpulseTranslator implements TransformTranslator {
+ private final PubsubUnboundedSink transform;
- @Override
- public void translate(Impulse transform, TransformTranslator.TranslationContext context) {
- if (context.getPipelineOptions().isStreaming()) {
- StepTranslationContext stepContext = context.addStep(transform, "ParallelRead");
- stepContext.addInput(PropertyNames.FORMAT, "pubsub");
- stepContext.addInput(PropertyNames.PUBSUB_SUBSCRIPTION, "_starting_signal/");
- stepContext.addOutput(PropertyNames.OUTPUT, context.getOutput(transform));
- } else {
- StepTranslationContext stepContext = context.addStep(transform, "ParallelRead");
- stepContext.addInput(PropertyNames.FORMAT, "impulse");
- WindowedValue.FullWindowedValueCoder coder =
- WindowedValue.getFullCoder(
- context.getOutput(transform).getCoder(), GlobalWindow.Coder.INSTANCE);
- byte[] encodedImpulse;
- try {
- encodedImpulse = encodeToByteArray(coder, WindowedValue.valueInGlobalWindow(new byte[0]));
- } catch (Exception e) {
- throw new RuntimeException(e);
+ /**
+ * Builds an instance of this class from the overridden transform.
+ */
+ public StreamingPubsubIOWrite(DataflowRunner runner, PubsubUnboundedSink transform) {
+ this.transform = transform;
+ }
+
+ PubsubUnboundedSink getOverriddenTransform() {
+ return transform;
+ }
+
+ @Override
+ public PDone expand(PCollection input) {
+ return PDone.in(input.getPipeline());
+ }
+
+ @Override
+ protected String getKindString() {
+ return "StreamingPubsubIOWrite";
+ }
+
+ static {
+ DataflowPipelineTranslator.registerTransformTranslator(
+ StreamingPubsubIOWrite.class,
+ new StreamingPubsubSinkTranslators.StreamingPubsubIOWriteTranslator());
}
- stepContext.addInput(PropertyNames.IMPULSE_ELEMENT, byteArrayToJsonString(encodedImpulse));
- stepContext.addOutput(PropertyNames.OUTPUT, context.getOutput(transform));
- }
}
- }
- static {
- DataflowPipelineTranslator.registerTransformTranslator(Impulse.class, new ImpulseTranslator());
- }
+ private static class StreamingPubsubSinkTranslators {
- private static class StreamingUnboundedReadOverrideFactory
- implements PTransformOverrideFactory, Read.Unbounded> {
+ /**
+ * Rewrite {@link StreamingPubsubIOWrite} to the appropriate internal
+ * node.
+ */
+ static class StreamingPubsubIOWriteTranslator
+ implements TransformTranslator<StreamingPubsubIOWrite> {
- @Override
- public PTransformReplacement> getReplacementTransform(
- AppliedPTransform, Read.Unbounded> transform) {
- return PTransformReplacement.of(
- transform.getPipeline().begin(), new StreamingUnboundedRead<>(transform.getTransform()));
+ @Override
+ public void translate(
+ StreamingPubsubIOWrite transform, TransformTranslator.TranslationContext context) {
+ checkArgument(
+ context.getPipelineOptions().isStreaming(),
+ "StreamingPubsubIOWrite is only for streaming pipelines.");
+ StepTranslationContext stepContext = context.addStep(transform, "ParallelWrite");
+ StreamingPubsubSinkTranslators.translate(
+ transform.getOverriddenTransform(), stepContext, context.getInput(transform));
+ }
+ }
+
+ private static void translate(
+ PubsubUnboundedSink overriddenTransform,
+ StepTranslationContext stepContext,
+ PCollection<PubsubMessage> input) {
+ stepContext.addInput(PropertyNames.FORMAT, "pubsub");
+ if (overriddenTransform.getTopicProvider() != null) {
+ if (overriddenTransform.getTopicProvider().isAccessible()) {
+ stepContext.addInput(
+ PropertyNames.PUBSUB_TOPIC, overriddenTransform.getTopic().getFullPath());
+ } else {
+ stepContext.addInput(
+ PropertyNames.PUBSUB_TOPIC_OVERRIDE,
+ ((NestedValueProvider) overriddenTransform.getTopicProvider()).propertyName());
+ }
+ } else {
+ stepContext.addInput(PropertyNames.PUBSUB_DYNAMIC_DESTINATIONS, true);
+ }
+ if (overriddenTransform.getTimestampAttribute() != null) {
+ stepContext.addInput(
+ PropertyNames.PUBSUB_TIMESTAMP_ATTRIBUTE, overriddenTransform.getTimestampAttribute());
+ }
+ if (overriddenTransform.getIdAttribute() != null) {
+ stepContext.addInput(
+ PropertyNames.PUBSUB_ID_ATTRIBUTE, overriddenTransform.getIdAttribute());
+ }
+ stepContext.addInput(
+ PropertyNames.PUBSUB_SERIALIZED_ATTRIBUTES_FN,
+ byteArrayToJsonString(serializeToByteArray(new IdentityMessageFn())));
+
+ // Using a GlobalWindowCoder as a placeholder because GlobalWindowCoder is a known coder.
+ stepContext.addEncodingInput(
+ WindowedValue.getFullCoder(VoidCoder.of(), GlobalWindow.Coder.INSTANCE));
+ stepContext.addInput(PropertyNames.PARALLEL_INPUT, input);
+ }
}
- @Override
- public Map, ReplacementOutput> mapOutputs(
- Map, PCollection>> outputs, PCollection newOutput) {
- return ReplacementOutputs.singleton(outputs, newOutput);
+ // ================================================================================
+ private static class SingleOutputExpandableTransformTranslator
+ implements TransformTranslator<External.SingleOutputExpandableTransform> {
+
+ @Override
+ public void translate(
+ External.SingleOutputExpandableTransform transform, TranslationContext context) {
+ StepTranslationContext stepContext = context.addStep(transform, "ExternalTransform");
+ PCollection<?> output = (PCollection<?>) context.getOutput(transform);
+ stepContext.addOutput(PropertyNames.OUTPUT, output);
+ }
}
- }
- /**
- * Specialized implementation for {@link org.apache.beam.sdk.io.Read.Unbounded Read.Unbounded} for
- * the Dataflow runner in streaming mode.
- *
- * In particular, if an UnboundedSource requires deduplication, then features of WindmillSink
- * are leveraged to do the deduplication.
- */
- private static class StreamingUnboundedRead extends PTransform> {
+ static {
+ DataflowPipelineTranslator.registerTransformTranslator(
+ External.SingleOutputExpandableTransform.class,
+ new SingleOutputExpandableTransformTranslator());
+ }
+
+ private static class MultiOutputExpandableTransformTranslator
+ implements TransformTranslator<External.MultiOutputExpandableTransform> {
+
+ @Override
+ public void translate(
+ External.MultiOutputExpandableTransform transform, TranslationContext context) {
+ StepTranslationContext stepContext = context.addStep(transform, "ExternalTransform");
+ Map<TupleTag<?>, PCollection<?>> outputs = context.getOutputs(transform);
+ for (Map.Entry<TupleTag<?>, PCollection<?>> taggedOutput : outputs.entrySet()) {
+ TupleTag<?> tag = taggedOutput.getKey();
+ stepContext.addOutput(tag.getId(), taggedOutput.getValue());
+ }
+ }
+ }
- private final UnboundedSource source;
+ static {
+ DataflowPipelineTranslator.registerTransformTranslator(
+ External.MultiOutputExpandableTransform.class,
+ new MultiOutputExpandableTransformTranslator());
+ }
+
+ private static class ImpulseTranslator implements TransformTranslator<Impulse> {
+
+ @Override
+ public void translate(Impulse transform, TransformTranslator.TranslationContext context) {
+ if (context.getPipelineOptions().isStreaming()) {
+ StepTranslationContext stepContext = context.addStep(transform, "ParallelRead");
+ stepContext.addInput(PropertyNames.FORMAT, "pubsub");
+ stepContext.addInput(PropertyNames.PUBSUB_SUBSCRIPTION, "_starting_signal/");
+ stepContext.addOutput(PropertyNames.OUTPUT, context.getOutput(transform));
+ } else {
+ StepTranslationContext stepContext = context.addStep(transform, "ParallelRead");
+ stepContext.addInput(PropertyNames.FORMAT, "impulse");
+ WindowedValue.FullWindowedValueCoder<byte[]> coder
+ = WindowedValue.getFullCoder(
+ context.getOutput(transform).getCoder(), GlobalWindow.Coder.INSTANCE);
+ byte[] encodedImpulse;
+ try {
+ encodedImpulse = encodeToByteArray(coder, WindowedValue.valueInGlobalWindow(new byte[0]));
+ } catch (Exception e) {
+ throw new RuntimeException(e);
+ }
+ stepContext.addInput(PropertyNames.IMPULSE_ELEMENT, byteArrayToJsonString(encodedImpulse));
+ stepContext.addOutput(PropertyNames.OUTPUT, context.getOutput(transform));
+ }
+ }
+ }
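+
+ // For illustration: the batch-mode impulse element round-trips as a single empty byte
+ // array in the global window, i.e. (sketch; decodeFromByteArray / jsonStringToByteArray
+ // are the decode counterparts of the helpers used above):
+ //
+ //   WindowedValue<byte[]> decoded =
+ //       decodeFromByteArray(coder, jsonStringToByteArray(encodedImpulse));
+ //   // decoded.getValue().length == 0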
- public StreamingUnboundedRead(Read.Unbounded