docs: update docs (#916)
* fix: re-run script
* test: fix noxfile
diff --git a/docs/dyn/dataflow_v1b3.projects.locations.flexTemplates.html b/docs/dyn/dataflow_v1b3.projects.locations.flexTemplates.html
index aaa07be..3aee8db 100644
--- a/docs/dyn/dataflow_v1b3.projects.locations.flexTemplates.html
+++ b/docs/dyn/dataflow_v1b3.projects.locations.flexTemplates.html
@@ -94,9 +94,14 @@
"validateOnly": True or False, # If true, the request is validated but not actually executed.
# Defaults to false.
"launchParameter": { # Launch FlexTemplate Parameter. # Required. Parameter to launch a job form Flex Template.
+ "containerSpecGcsPath": "A String", # Gcs path to a file with json serialized ContainerSpec as content.
+ "parameters": { # The parameters for FlexTemplate.
+ # Ex. {"num_workers":"5"}
+ "a_key": "A String",
+ },
+ "jobName": "A String", # Required. The job name to use for the created job.
"containerSpec": { # Container Spec. # Spec about the container image to launch.
"metadata": { # Metadata describing a template. # Metadata describing a template including description and validation rules.
- "name": "A String", # Required. The name of the template.
"parameters": [ # The parameters for the template.
{ # Metadata for a specific parameter.
"label": "A String", # Required. The label to display for the parameter.
@@ -110,6 +115,7 @@
"isOptional": True or False, # Optional. Whether the parameter is optional. Defaults to false.
},
],
+ "name": "A String", # Required. The name of the template.
"description": "A String", # Optional. A description of the template.
},
"sdkInfo": { # SDK Information. # Required. SDK info of the Flex Template.
@@ -118,12 +124,6 @@
},
"image": "A String", # Name of the docker container image. E.g., gcr.io/project/some-image
},
- "containerSpecGcsPath": "A String", # Gcs path to a file with json serialized ContainerSpec as content.
- "parameters": { # The parameters for FlexTemplate.
- # Ex. {"num_workers":"5"}
- "a_key": "A String",
- },
- "jobName": "A String", # Required. The job name to use for the created job.
},
}
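For reference, a minimal sketch of launching a Flex Template through the regenerated Python client, using the request body documented above. The project ID, region, GCS path, and parameter values are hypothetical placeholders.

# Sketch: launch a Dataflow Flex Template via the generated v1b3 client.
# Project, region, GCS path, and parameter values below are hypothetical.
from googleapiclient.discovery import build

dataflow = build("dataflow", "v1b3")  # uses application-default credentials

body = {
    "validateOnly": False,
    "launchParameter": {
        "jobName": "example-flex-job",
        "containerSpecGcsPath": "gs://example-bucket/templates/spec.json",
        "parameters": {"num_workers": "5"},
    },
}

response = (
    dataflow.projects()
    .locations()
    .flexTemplates()
    .launch(projectId="example-project", location="us-central1", body=body)
    .execute()
)
print(response.get("job", {}).get("id"))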
@@ -155,219 +155,6 @@
"a_key": "A String",
},
"environment": { # Describes the environment in which a Dataflow Job runs. # The environment for the job.
- "sdkPipelineOptions": { # The Cloud Dataflow SDK pipeline options specified by the user. These
- # options are passed through the service and are used to recreate the
- # SDK pipeline options on the worker in a language agnostic and platform
- # independent way.
- "a_key": "", # Properties of the object.
- },
- "flexResourceSchedulingGoal": "A String", # Which Flexible Resource Scheduling mode to run in.
- "workerPools": [ # The worker pools. At least one "harness" worker pool must be
- # specified in order for the job to have workers.
- { # Describes one particular pool of Cloud Dataflow workers to be
- # instantiated by the Cloud Dataflow service in order to perform the
- # computations required by a job. Note that a workflow job may use
- # multiple pools, in order to match the various computational
- # requirements of the various stages of the job.
- "defaultPackageSet": "A String", # The default package set to install. This allows the service to
- # select a default set of packages which are useful to worker
- # harnesses written in a particular language.
- "network": "A String", # Network to which VMs will be assigned. If empty or unspecified,
- # the service will use the network "default".
- "zone": "A String", # Zone to run the worker pools in. If empty or unspecified, the service
- # will attempt to choose a reasonable default.
- "numWorkers": 42, # Number of Google Compute Engine workers in this pool needed to
- # execute the job. If zero or unspecified, the service will
- # attempt to choose a reasonable default.
- "numThreadsPerWorker": 42, # The number of threads per worker harness. If empty or unspecified, the
- # service will choose a number of threads (according to the number of cores
- # on the selected machine type for batch, or 1 by convention for streaming).
- "diskSourceImage": "A String", # Fully qualified source image for disks.
- "packages": [ # Packages to be installed on workers.
- { # The packages that must be installed in order for a worker to run the
- # steps of the Cloud Dataflow job that will be assigned to its worker
- # pool.
- #
- # This is the mechanism by which the Cloud Dataflow SDK causes code to
- # be loaded onto the workers. For example, the Cloud Dataflow Java SDK
- # might use this to install jars containing the user's code and all of the
- # various dependencies (libraries, data files, etc.) required in order
- # for that code to run.
- "location": "A String", # The resource to read the package from. The supported resource type is:
- #
- # Google Cloud Storage:
- #
- # storage.googleapis.com/{bucket}
- # bucket.storage.googleapis.com/
- "name": "A String", # The name of the package.
- },
- ],
- "teardownPolicy": "A String", # Sets the policy for determining when to turndown worker pool.
- # Allowed values are: `TEARDOWN_ALWAYS`, `TEARDOWN_ON_SUCCESS`, and
- # `TEARDOWN_NEVER`.
- # `TEARDOWN_ALWAYS` means workers are always torn down regardless of whether
- # the job succeeds. `TEARDOWN_ON_SUCCESS` means workers are torn down
- # if the job succeeds. `TEARDOWN_NEVER` means the workers are never torn
- # down.
- #
- # If the workers are not torn down by the service, they will
- # continue to run and use Google Compute Engine VM resources in the
- # user's project until they are explicitly terminated by the user.
- # Because of this, Google recommends using the `TEARDOWN_ALWAYS`
- # policy except for small, manually supervised test jobs.
- #
- # If unknown or unspecified, the service will attempt to choose a reasonable
- # default.
- "onHostMaintenance": "A String", # The action to take on host maintenance, as defined by the Google
- # Compute Engine API.
- "poolArgs": { # Extra arguments for this worker pool.
- "a_key": "", # Properties of the object. Contains field @type with type URL.
- },
- "diskSizeGb": 42, # Size of root disk for VMs, in GB. If zero or unspecified, the service will
- # attempt to choose a reasonable default.
- "workerHarnessContainerImage": "A String", # Required. Docker container image that executes the Cloud Dataflow worker
- # harness, residing in Google Container Registry.
- #
- # Deprecated for the Fn API path. Use sdk_harness_container_images instead.
- "diskType": "A String", # Type of root disk for VMs. If empty or unspecified, the service will
- # attempt to choose a reasonable default.
- "machineType": "A String", # Machine type (e.g. "n1-standard-1"). If empty or unspecified, the
- # service will attempt to choose a reasonable default.
- "kind": "A String", # The kind of the worker pool; currently only `harness` and `shuffle`
- # are supported.
- "dataDisks": [ # Data disks that are used by a VM in this workflow.
- { # Describes the data disk used by a workflow job.
- "sizeGb": 42, # Size of disk in GB. If zero or unspecified, the service will
- # attempt to choose a reasonable default.
- "diskType": "A String", # Disk storage type, as defined by Google Compute Engine. This
- # must be a disk type appropriate to the project and zone in which
- # the workers will run. If unknown or unspecified, the service
- # will attempt to choose a reasonable default.
- #
- # For example, the standard persistent disk type is a resource name
- # typically ending in "pd-standard". If SSD persistent disks are
- # available, the resource name typically ends with "pd-ssd". The
- # actual valid values are defined the Google Compute Engine API,
- # not by the Cloud Dataflow API; consult the Google Compute Engine
- # documentation for more information about determining the set of
- # available disk types for a particular project and zone.
- #
- # Google Compute Engine Disk types are local to a particular
- # project in a particular zone, and so the resource name will
- # typically look something like this:
- #
- # compute.googleapis.com/projects/project-id/zones/zone/diskTypes/pd-standard
- "mountPoint": "A String", # Directory in a VM where disk is mounted.
- },
- ],
- "sdkHarnessContainerImages": [ # Set of SDK harness containers needed to execute this pipeline. This will
- # only be set in the Fn API path. For non-cross-language pipelines this
- # should have only one entry. Cross-language pipelines will have two or more
- # entries.
- { # Defines a SDK harness container for executing Dataflow pipelines.
- "containerImage": "A String", # A docker container image that resides in Google Container Registry.
- "useSingleCorePerContainer": True or False, # If true, recommends the Dataflow service to use only one core per SDK
- # container instance with this image. If false (or unset) recommends using
- # more than one core per SDK container instance with this image for
- # efficiency. Note that Dataflow service may choose to override this property
- # if needed.
- },
- ],
- "subnetwork": "A String", # Subnetwork to which VMs will be assigned, if desired. Expected to be of
- # the form "regions/REGION/subnetworks/SUBNETWORK".
- "ipConfiguration": "A String", # Configuration for VM IPs.
- "taskrunnerSettings": { # Taskrunner configuration settings. # Settings passed through to Google Compute Engine workers when
- # using the standard Dataflow task runner. Users should ignore
- # this field.
- "alsologtostderr": True or False, # Whether to also send taskrunner log info to stderr.
- "taskGroup": "A String", # The UNIX group ID on the worker VM to use for tasks launched by
- # taskrunner; e.g. "wheel".
- "harnessCommand": "A String", # The command to launch the worker harness.
- "logDir": "A String", # The directory on the VM to store logs.
- "oauthScopes": [ # The OAuth2 scopes to be requested by the taskrunner in order to
- # access the Cloud Dataflow API.
- "A String",
- ],
- "dataflowApiVersion": "A String", # The API version of endpoint, e.g. "v1b3"
- "logUploadLocation": "A String", # Indicates where to put logs. If this is not specified, the logs
- # will not be uploaded.
- #
- # The supported resource type is:
- #
- # Google Cloud Storage:
- # storage.googleapis.com/{bucket}/{object}
- # bucket.storage.googleapis.com/{object}
- "streamingWorkerMainClass": "A String", # The streaming worker main class name.
- "workflowFileName": "A String", # The file to store the workflow in.
- "baseTaskDir": "A String", # The location on the worker for task-specific subdirectories.
- "tempStoragePrefix": "A String", # The prefix of the resources the taskrunner should use for
- # temporary storage.
- #
- # The supported resource type is:
- #
- # Google Cloud Storage:
- # storage.googleapis.com/{bucket}/{object}
- # bucket.storage.googleapis.com/{object}
- "commandlinesFileName": "A String", # The file to store preprocessing commands in.
- "languageHint": "A String", # The suggested backend language.
- "baseUrl": "A String", # The base URL for the taskrunner to use when accessing Google Cloud APIs.
- #
- # When workers access Google Cloud APIs, they logically do so via
- # relative URLs. If this field is specified, it supplies the base
- # URL to use for resolving these relative URLs. The normative
- # algorithm used is defined by RFC 1808, "Relative Uniform Resource
- # Locators".
- #
- # If not specified, the default value is "http://www.googleapis.com/"
- "logToSerialconsole": True or False, # Whether to send taskrunner log info to Google Compute Engine VM serial
- # console.
- "continueOnException": True or False, # Whether to continue taskrunner if an exception is hit.
- "parallelWorkerSettings": { # Provides data to pass through to the worker harness. # The settings to pass to the parallel worker harness.
- "baseUrl": "A String", # The base URL for accessing Google Cloud APIs.
- #
- # When workers access Google Cloud APIs, they logically do so via
- # relative URLs. If this field is specified, it supplies the base
- # URL to use for resolving these relative URLs. The normative
- # algorithm used is defined by RFC 1808, "Relative Uniform Resource
- # Locators".
- #
- # If not specified, the default value is "http://www.googleapis.com/"
- "reportingEnabled": True or False, # Whether to send work progress updates to the service.
- "servicePath": "A String", # The Cloud Dataflow service path relative to the root URL, for example,
- # "dataflow/v1b3/projects".
- "shuffleServicePath": "A String", # The Shuffle service path relative to the root URL, for example,
- # "shuffle/v1beta1".
- "workerId": "A String", # The ID of the worker running this pipeline.
- "tempStoragePrefix": "A String", # The prefix of the resources the system should use for temporary
- # storage.
- #
- # The supported resource type is:
- #
- # Google Cloud Storage:
- #
- # storage.googleapis.com/{bucket}/{object}
- # bucket.storage.googleapis.com/{object}
- },
- "vmId": "A String", # The ID string of the VM.
- "taskUser": "A String", # The UNIX user ID on the worker VM to use for tasks launched by
- # taskrunner; e.g. "root".
- },
- "autoscalingSettings": { # Settings for WorkerPool autoscaling. # Settings for autoscaling of this WorkerPool.
- "maxNumWorkers": 42, # The maximum number of workers to cap scaling at.
- "algorithm": "A String", # The algorithm to use for autoscaling.
- },
- "metadata": { # Metadata to set on the Google Compute Engine VMs.
- "a_key": "A String",
- },
- },
- ],
- "dataset": "A String", # The dataset for the current project where various workflow
- # related tables are stored.
- #
- # The supported resource type is:
- #
- # Google BigQuery:
- # bigquery.googleapis.com/{dataset}
"internalExperiments": { # Experimental settings.
"a_key": "", # Properties of the object. Contains field @type with type URL.
},
@@ -414,50 +201,249 @@
"a_key": "", # Properties of the object.
},
"serviceAccountEmail": "A String", # Identity to run virtual machines as. Defaults to the default account.
+ "sdkPipelineOptions": { # The Cloud Dataflow SDK pipeline options specified by the user. These
+ # options are passed through the service and are used to recreate the
+ # SDK pipeline options on the worker in a language agnostic and platform
+ # independent way.
+ "a_key": "", # Properties of the object.
+ },
+ "flexResourceSchedulingGoal": "A String", # Which Flexible Resource Scheduling mode to run in.
+ "workerPools": [ # The worker pools. At least one "harness" worker pool must be
+ # specified in order for the job to have workers.
+ { # Describes one particular pool of Cloud Dataflow workers to be
+ # instantiated by the Cloud Dataflow service in order to perform the
+ # computations required by a job. Note that a workflow job may use
+ # multiple pools, in order to match the various computational
+ # requirements of the various stages of the job.
+ "numThreadsPerWorker": 42, # The number of threads per worker harness. If empty or unspecified, the
+ # service will choose a number of threads (according to the number of cores
+ # on the selected machine type for batch, or 1 by convention for streaming).
+ "numWorkers": 42, # Number of Google Compute Engine workers in this pool needed to
+ # execute the job. If zero or unspecified, the service will
+ # attempt to choose a reasonable default.
+ "zone": "A String", # Zone to run the worker pools in. If empty or unspecified, the service
+ # will attempt to choose a reasonable default.
+ "diskSourceImage": "A String", # Fully qualified source image for disks.
+ "packages": [ # Packages to be installed on workers.
+ { # The packages that must be installed in order for a worker to run the
+ # steps of the Cloud Dataflow job that will be assigned to its worker
+ # pool.
+ #
+ # This is the mechanism by which the Cloud Dataflow SDK causes code to
+ # be loaded onto the workers. For example, the Cloud Dataflow Java SDK
+ # might use this to install jars containing the user's code and all of the
+ # various dependencies (libraries, data files, etc.) required in order
+ # for that code to run.
+ "name": "A String", # The name of the package.
+ "location": "A String", # The resource to read the package from. The supported resource type is:
+ #
+ # Google Cloud Storage:
+ #
+ # storage.googleapis.com/{bucket}
+ # bucket.storage.googleapis.com/
+ },
+ ],
+ "teardownPolicy": "A String", # Sets the policy for determining when to turndown worker pool.
+ # Allowed values are: `TEARDOWN_ALWAYS`, `TEARDOWN_ON_SUCCESS`, and
+ # `TEARDOWN_NEVER`.
+ # `TEARDOWN_ALWAYS` means workers are always torn down regardless of whether
+ # the job succeeds. `TEARDOWN_ON_SUCCESS` means workers are torn down
+ # if the job succeeds. `TEARDOWN_NEVER` means the workers are never torn
+ # down.
+ #
+ # If the workers are not torn down by the service, they will
+ # continue to run and use Google Compute Engine VM resources in the
+ # user's project until they are explicitly terminated by the user.
+ # Because of this, Google recommends using the `TEARDOWN_ALWAYS`
+ # policy except for small, manually supervised test jobs.
+ #
+ # If unknown or unspecified, the service will attempt to choose a reasonable
+ # default.
+ "onHostMaintenance": "A String", # The action to take on host maintenance, as defined by the Google
+ # Compute Engine API.
+ "poolArgs": { # Extra arguments for this worker pool.
+ "a_key": "", # Properties of the object. Contains field @type with type URL.
+ },
+ "diskSizeGb": 42, # Size of root disk for VMs, in GB. If zero or unspecified, the service will
+ # attempt to choose a reasonable default.
+ "workerHarnessContainerImage": "A String", # Required. Docker container image that executes the Cloud Dataflow worker
+ # harness, residing in Google Container Registry.
+ #
+ # Deprecated for the Fn API path. Use sdk_harness_container_images instead.
+ "diskType": "A String", # Type of root disk for VMs. If empty or unspecified, the service will
+ # attempt to choose a reasonable default.
+ "machineType": "A String", # Machine type (e.g. "n1-standard-1"). If empty or unspecified, the
+ # service will attempt to choose a reasonable default.
+ "kind": "A String", # The kind of the worker pool; currently only `harness` and `shuffle`
+ # are supported.
+ "sdkHarnessContainerImages": [ # Set of SDK harness containers needed to execute this pipeline. This will
+ # only be set in the Fn API path. For non-cross-language pipelines this
+ # should have only one entry. Cross-language pipelines will have two or more
+ # entries.
+ { # Defines a SDK harness container for executing Dataflow pipelines.
+ "containerImage": "A String", # A docker container image that resides in Google Container Registry.
+ "useSingleCorePerContainer": True or False, # If true, recommends the Dataflow service to use only one core per SDK
+ # container instance with this image. If false (or unset) recommends using
+ # more than one core per SDK container instance with this image for
+ # efficiency. Note that Dataflow service may choose to override this property
+ # if needed.
+ },
+ ],
+ "dataDisks": [ # Data disks that are used by a VM in this workflow.
+ { # Describes the data disk used by a workflow job.
+ "diskType": "A String", # Disk storage type, as defined by Google Compute Engine. This
+ # must be a disk type appropriate to the project and zone in which
+ # the workers will run. If unknown or unspecified, the service
+ # will attempt to choose a reasonable default.
+ #
+ # For example, the standard persistent disk type is a resource name
+ # typically ending in "pd-standard". If SSD persistent disks are
+ # available, the resource name typically ends with "pd-ssd". The
+ # actual valid values are defined the Google Compute Engine API,
+ # not by the Cloud Dataflow API; consult the Google Compute Engine
+ # documentation for more information about determining the set of
+ # available disk types for a particular project and zone.
+ #
+ # Google Compute Engine Disk types are local to a particular
+ # project in a particular zone, and so the resource name will
+ # typically look something like this:
+ #
+ # compute.googleapis.com/projects/project-id/zones/zone/diskTypes/pd-standard
+ "sizeGb": 42, # Size of disk in GB. If zero or unspecified, the service will
+ # attempt to choose a reasonable default.
+ "mountPoint": "A String", # Directory in a VM where disk is mounted.
+ },
+ ],
+ "subnetwork": "A String", # Subnetwork to which VMs will be assigned, if desired. Expected to be of
+ # the form "regions/REGION/subnetworks/SUBNETWORK".
+ "ipConfiguration": "A String", # Configuration for VM IPs.
+ "taskrunnerSettings": { # Taskrunner configuration settings. # Settings passed through to Google Compute Engine workers when
+ # using the standard Dataflow task runner. Users should ignore
+ # this field.
+ "alsologtostderr": True or False, # Whether to also send taskrunner log info to stderr.
+ "taskGroup": "A String", # The UNIX group ID on the worker VM to use for tasks launched by
+ # taskrunner; e.g. "wheel".
+ "harnessCommand": "A String", # The command to launch the worker harness.
+ "logDir": "A String", # The directory on the VM to store logs.
+ "oauthScopes": [ # The OAuth2 scopes to be requested by the taskrunner in order to
+ # access the Cloud Dataflow API.
+ "A String",
+ ],
+ "dataflowApiVersion": "A String", # The API version of endpoint, e.g. "v1b3"
+ "logUploadLocation": "A String", # Indicates where to put logs. If this is not specified, the logs
+ # will not be uploaded.
+ #
+ # The supported resource type is:
+ #
+ # Google Cloud Storage:
+ # storage.googleapis.com/{bucket}/{object}
+ # bucket.storage.googleapis.com/{object}
+ "streamingWorkerMainClass": "A String", # The streaming worker main class name.
+ "workflowFileName": "A String", # The file to store the workflow in.
+ "languageHint": "A String", # The suggested backend language.
+ "commandlinesFileName": "A String", # The file to store preprocessing commands in.
+ "baseTaskDir": "A String", # The location on the worker for task-specific subdirectories.
+ "tempStoragePrefix": "A String", # The prefix of the resources the taskrunner should use for
+ # temporary storage.
+ #
+ # The supported resource type is:
+ #
+ # Google Cloud Storage:
+ # storage.googleapis.com/{bucket}/{object}
+ # bucket.storage.googleapis.com/{object}
+ "baseUrl": "A String", # The base URL for the taskrunner to use when accessing Google Cloud APIs.
+ #
+ # When workers access Google Cloud APIs, they logically do so via
+ # relative URLs. If this field is specified, it supplies the base
+ # URL to use for resolving these relative URLs. The normative
+ # algorithm used is defined by RFC 1808, "Relative Uniform Resource
+ # Locators".
+ #
+ # If not specified, the default value is "http://www.googleapis.com/"
+ "logToSerialconsole": True or False, # Whether to send taskrunner log info to Google Compute Engine VM serial
+ # console.
+ "continueOnException": True or False, # Whether to continue taskrunner if an exception is hit.
+ "parallelWorkerSettings": { # Provides data to pass through to the worker harness. # The settings to pass to the parallel worker harness.
+ "tempStoragePrefix": "A String", # The prefix of the resources the system should use for temporary
+ # storage.
+ #
+ # The supported resource type is:
+ #
+ # Google Cloud Storage:
+ #
+ # storage.googleapis.com/{bucket}/{object}
+ # bucket.storage.googleapis.com/{object}
+ "reportingEnabled": True or False, # Whether to send work progress updates to the service.
+ "baseUrl": "A String", # The base URL for accessing Google Cloud APIs.
+ #
+ # When workers access Google Cloud APIs, they logically do so via
+ # relative URLs. If this field is specified, it supplies the base
+ # URL to use for resolving these relative URLs. The normative
+ # algorithm used is defined by RFC 1808, "Relative Uniform Resource
+ # Locators".
+ #
+ # If not specified, the default value is "http://www.googleapis.com/"
+ "servicePath": "A String", # The Cloud Dataflow service path relative to the root URL, for example,
+ # "dataflow/v1b3/projects".
+ "shuffleServicePath": "A String", # The Shuffle service path relative to the root URL, for example,
+ # "shuffle/v1beta1".
+ "workerId": "A String", # The ID of the worker running this pipeline.
+ },
+ "taskUser": "A String", # The UNIX user ID on the worker VM to use for tasks launched by
+ # taskrunner; e.g. "root".
+ "vmId": "A String", # The ID string of the VM.
+ },
+ "autoscalingSettings": { # Settings for WorkerPool autoscaling. # Settings for autoscaling of this WorkerPool.
+ "algorithm": "A String", # The algorithm to use for autoscaling.
+ "maxNumWorkers": 42, # The maximum number of workers to cap scaling at.
+ },
+ "metadata": { # Metadata to set on the Google Compute Engine VMs.
+ "a_key": "A String",
+ },
+ "defaultPackageSet": "A String", # The default package set to install. This allows the service to
+ # select a default set of packages which are useful to worker
+ # harnesses written in a particular language.
+ "network": "A String", # Network to which VMs will be assigned. If empty or unspecified,
+ # the service will use the network "default".
+ },
+ ],
+ "dataset": "A String", # The dataset for the current project where various workflow
+ # related tables are stored.
+ #
+ # The supported resource type is:
+ #
+ # Google BigQuery:
+ # bigquery.googleapis.com/{dataset}
},
"stageStates": [ # This field may be mutated by the Cloud Dataflow service;
# callers cannot mutate it.
{ # A message describing the state of a particular execution stage.
- "executionStageName": "A String", # The name of the execution stage.
"currentStateTime": "A String", # The time at which the stage transitioned to this state.
"executionStageState": "A String", # Executions stage states allow the same set of values as JobState.
+ "executionStageName": "A String", # The name of the execution stage.
},
],
"jobMetadata": { # Metadata available primarily for filtering jobs. Will be included in the # This field is populated by the Dataflow service to support filtering jobs
# by the metadata values provided here. Populated for ListJobs and all GetJob
# views SUMMARY and higher.
# ListJob response and Job SUMMARY view.
- "bigTableDetails": [ # Identification of a BigTable source used in the Dataflow job.
- { # Metadata for a BigTable connector used by the job.
- "tableId": "A String", # TableId accessed in the connection.
- "projectId": "A String", # ProjectId accessed in the connection.
- "instanceId": "A String", # InstanceId accessed in the connection.
- },
- ],
- "spannerDetails": [ # Identification of a Spanner source used in the Dataflow job.
- { # Metadata for a Spanner connector used by the job.
- "databaseId": "A String", # DatabaseId accessed in the connection.
- "instanceId": "A String", # InstanceId accessed in the connection.
- "projectId": "A String", # ProjectId accessed in the connection.
- },
- ],
"datastoreDetails": [ # Identification of a Datastore source used in the Dataflow job.
{ # Metadata for a Datastore connector used by the job.
- "projectId": "A String", # ProjectId accessed in the connection.
"namespace": "A String", # Namespace used in the connection.
+ "projectId": "A String", # ProjectId accessed in the connection.
},
],
"sdkVersion": { # The version of the SDK used to run the job. # The SDK version used to run the job.
- "versionDisplayName": "A String", # A readable string describing the version of the SDK.
- "sdkSupportStatus": "A String", # The support status for this SDK version.
"version": "A String", # The version of the SDK used to run the job.
+ "sdkSupportStatus": "A String", # The support status for this SDK version.
+ "versionDisplayName": "A String", # A readable string describing the version of the SDK.
},
"bigqueryDetails": [ # Identification of a BigQuery source used in the Dataflow job.
{ # Metadata for a BigQuery connector used by the job.
"table": "A String", # Table accessed in the connection.
"dataset": "A String", # Dataset accessed in the connection.
- "projectId": "A String", # Project accessed in the connection.
"query": "A String", # Query used to access data in the connection.
+ "projectId": "A String", # Project accessed in the connection.
},
],
"fileDetails": [ # Identification of a File source used in the Dataflow job.
@@ -467,15 +453,29 @@
],
"pubsubDetails": [ # Identification of a PubSub source used in the Dataflow job.
{ # Metadata for a PubSub connector used by the job.
- "subscription": "A String", # Subscription used in the connection.
"topic": "A String", # Topic accessed in the connection.
+ "subscription": "A String", # Subscription used in the connection.
+ },
+ ],
+ "bigTableDetails": [ # Identification of a BigTable source used in the Dataflow job.
+ { # Metadata for a BigTable connector used by the job.
+ "projectId": "A String", # ProjectId accessed in the connection.
+ "instanceId": "A String", # InstanceId accessed in the connection.
+ "tableId": "A String", # TableId accessed in the connection.
+ },
+ ],
+ "spannerDetails": [ # Identification of a Spanner source used in the Dataflow job.
+ { # Metadata for a Spanner connector used by the job.
+ "instanceId": "A String", # InstanceId accessed in the connection.
+ "projectId": "A String", # ProjectId accessed in the connection.
+ "databaseId": "A String", # DatabaseId accessed in the connection.
},
],
},
+ "type": "A String", # The type of Cloud Dataflow job.
+ "projectId": "A String", # The ID of the Cloud Platform project that the job belongs to.
"createdFromSnapshotId": "A String", # If this is specified, the job's initial state is populated from the given
# snapshot.
- "projectId": "A String", # The ID of the Cloud Platform project that the job belongs to.
- "type": "A String", # The type of Cloud Dataflow job.
"pipelineDescription": { # A descriptive representation of submitted pipeline as well as the executed # Preliminary field: The format of this data may change at any time.
# A description of the user pipeline and stages through which it is executed.
# Created by Cloud Dataflow service. Only retrieved with
@@ -486,6 +486,25 @@
{ # Description of the composing transforms, names/ids, and input/outputs of a
# stage of execution. Some composing transforms and sources may have been
# generated by the Dataflow service during execution planning.
+ "outputSource": [ # Output sources for this stage.
+ { # Description of an input or output of an execution stage.
+ "sizeBytes": "A String", # Size of the source, if measurable.
+ "name": "A String", # Dataflow service generated name for this source.
+ "userName": "A String", # Human-readable name for this source; may be user or system generated.
+ "originalTransformOrCollection": "A String", # User name for the original user transform or collection with which this
+ # source is most closely associated.
+ },
+ ],
+ "name": "A String", # Dataflow service generated name for this stage.
+ "inputSource": [ # Input sources for this stage.
+ { # Description of an input or output of an execution stage.
+ "sizeBytes": "A String", # Size of the source, if measurable.
+ "name": "A String", # Dataflow service generated name for this source.
+ "userName": "A String", # Human-readable name for this source; may be user or system generated.
+ "originalTransformOrCollection": "A String", # User name for the original user transform or collection with which this
+ # source is most closely associated.
+ },
+ ],
"id": "A String", # Dataflow service generated id for this stage.
"componentTransform": [ # Transforms that comprise this execution stage.
{ # Description of a transform executed as part of an execution stage.
@@ -505,25 +524,6 @@
},
],
"kind": "A String", # Type of tranform this stage is executing.
- "outputSource": [ # Output sources for this stage.
- { # Description of an input or output of an execution stage.
- "originalTransformOrCollection": "A String", # User name for the original user transform or collection with which this
- # source is most closely associated.
- "name": "A String", # Dataflow service generated name for this source.
- "sizeBytes": "A String", # Size of the source, if measurable.
- "userName": "A String", # Human-readable name for this source; may be user or system generated.
- },
- ],
- "name": "A String", # Dataflow service generated name for this stage.
- "inputSource": [ # Input sources for this stage.
- { # Description of an input or output of an execution stage.
- "originalTransformOrCollection": "A String", # User name for the original user transform or collection with which this
- # source is most closely associated.
- "name": "A String", # Dataflow service generated name for this source.
- "sizeBytes": "A String", # Size of the source, if measurable.
- "userName": "A String", # Human-readable name for this source; may be user or system generated.
- },
- ],
},
],
"originalPipelineTransform": [ # Description of each transform in the pipeline and collections between them.
@@ -536,12 +536,8 @@
"id": "A String", # SDK generated id of this transform instance.
"displayData": [ # Transform-specific display data.
{ # Data provided with a pipeline or transform to provide descriptive info.
- "timestampValue": "A String", # Contains value if the data is of timestamp type.
- "boolValue": True or False, # Contains value if the data is of a boolean type.
- "javaClassValue": "A String", # Contains value if the data is of java class type.
- "strValue": "A String", # Contains value if the data is of string type.
- "int64Value": "A String", # Contains value if the data is of int64 type.
"durationValue": "A String", # Contains value if the data is of duration type.
+ "int64Value": "A String", # Contains value if the data is of int64 type.
"namespace": "A String", # The namespace for the key. This is usually a class name or programming
# language namespace (i.e. python module) which defines the display data.
# This allows a dax monitoring system to specially handle the data
@@ -558,6 +554,10 @@
# will be displayed as a tooltip.
"url": "A String", # An optional full URL.
"label": "A String", # An optional label to display in a dax UI for the element.
+ "timestampValue": "A String", # Contains value if the data is of timestamp type.
+ "boolValue": True or False, # Contains value if the data is of a boolean type.
+ "javaClassValue": "A String", # Contains value if the data is of java class type.
+ "strValue": "A String", # Contains value if the data is of string type.
},
],
"outputCollectionName": [ # User names for all collection outputs to this transform.
@@ -567,12 +567,8 @@
],
"displayData": [ # Pipeline level display data.
{ # Data provided with a pipeline or transform to provide descriptive info.
- "timestampValue": "A String", # Contains value if the data is of timestamp type.
- "boolValue": True or False, # Contains value if the data is of a boolean type.
- "javaClassValue": "A String", # Contains value if the data is of java class type.
- "strValue": "A String", # Contains value if the data is of string type.
- "int64Value": "A String", # Contains value if the data is of int64 type.
"durationValue": "A String", # Contains value if the data is of duration type.
+ "int64Value": "A String", # Contains value if the data is of int64 type.
"namespace": "A String", # The namespace for the key. This is usually a class name or programming
# language namespace (i.e. python module) which defines the display data.
# This allows a dax monitoring system to specially handle the data
@@ -589,6 +585,10 @@
# will be displayed as a tooltip.
"url": "A String", # An optional full URL.
"label": "A String", # An optional label to display in a dax UI for the element.
+ "timestampValue": "A String", # Contains value if the data is of timestamp type.
+ "boolValue": True or False, # Contains value if the data is of a boolean type.
+ "javaClassValue": "A String", # Contains value if the data is of java class type.
+ "strValue": "A String", # Contains value if the data is of string type.
},
],
},
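As a companion to the Job fields documented above, a minimal sketch of reading a few of them back with jobs.get. The project, region, and job ID are hypothetical, and many fields are only populated for certain job views or job types.

# Sketch: fetch a job and inspect fields from the Job schema shown above.
# Project, region, and jobId are hypothetical placeholders.
from googleapiclient.discovery import build

dataflow = build("dataflow", "v1b3")

job = (
    dataflow.projects()
    .locations()
    .jobs()
    .get(
        projectId="example-project",
        location="us-central1",
        jobId="2020-01-01_00_00_00-123456789012345678",
        view="JOB_VIEW_ALL",
    )
    .execute()
)

sdk = job.get("jobMetadata", {}).get("sdkVersion", {})
print("SDK:", sdk.get("version"), sdk.get("sdkSupportStatus"))

for pool in job.get("environment", {}).get("workerPools", []):
    print("pool:", pool.get("kind"), pool.get("machineType"), pool.get("numWorkers"))

for stage in job.get("stageStates", []):
    print(stage.get("executionStageName"), stage.get("executionStageState"))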