public interface DataflowPipelineOptions extends PipelineOptions, GcpOptions, ApplicationNameOptions, DataflowPipelineDebugOptions, DataflowPipelineWorkerPoolOptions, BigQueryOptions, GcsOptions, StreamingOptions, CloudDebuggerOptions, DataflowWorkerLoggingOptions, DataflowProfilingOptions, PubsubOptions
Options that can be used to configure the DataflowRunner.
Modifier and Type | Interface and Description |
---|---|
static class |
DataflowPipelineOptions.DefaultGcpRegionFactory
Factory for a default value for Google Cloud region according to
https://cloud.google.com/compute/docs/gcloud-compute/#default-properties.
|
static class |
DataflowPipelineOptions.FlexResourceSchedulingGoal
Set of available Flexible Resource Scheduling goals.
|
static class |
DataflowPipelineOptions.StagingLocationFactory
Returns a default staging location under
GcpOptions.getGcpTempLocation(). |
DataflowPipelineDebugOptions.DataflowClientFactory, DataflowPipelineDebugOptions.StagerFactory
DataflowPipelineWorkerPoolOptions.AutoscalingAlgorithmType, DataflowPipelineWorkerPoolOptions.WorkerHarnessContainerImageFactory
GcsOptions.ExecutorServiceFactory, GcsOptions.PathValidatorFactory
DataflowWorkerLoggingOptions.Level, DataflowWorkerLoggingOptions.WorkerLogLevelOverrides
DataflowProfilingOptions.DataflowProfilingAgentConfiguration
GcpOptions.DefaultProjectFactory, GcpOptions.EnableStreamingEngineFactory, GcpOptions.GcpTempLocationFactory, GcpOptions.GcpUserCredentialsFactory
GoogleApiDebugOptions.GoogleApiTracer
STATE_CACHE_SIZE
STREAMING_ENGINE_EXPERIMENT, WINDMILL_SERVICE_EXPERIMENT
Modifier and Type | Method and Description |
---|---|
java.lang.String |
getCreateFromSnapshot()
If set, the snapshot from which the job should be created.
|
java.lang.String |
getDataflowWorkerJar() |
DataflowPipelineOptions.FlexResourceSchedulingGoal |
getFlexRSGoal()
This option controls Flexible Resource Scheduling mode.
|
java.util.Map<java.lang.String,java.lang.String> |
getLabels()
Labels that will be applied to the billing records for this job.
|
java.lang.String |
getPipelineUrl()
The URL of the staged portable pipeline.
|
java.lang.String |
getProject()
Project id to use when launching jobs.
|
java.lang.String |
getRegion()
The Google Compute Engine region for creating Dataflow jobs.
|
java.lang.String |
getServiceAccount()
Run the job as a specific service account, instead of the default GCE robot.
|
java.lang.String |
getStagingLocation()
GCS path for staging local files, e.g. gs://bucket/object
|
java.lang.String |
getTemplateLocation()
Where the runner should generate a template file.
|
boolean |
isUpdate()
Whether to update the currently running pipeline with the same name as this one.
|
void |
setCreateFromSnapshot(java.lang.String value) |
void |
setDataflowWorkerJar(java.lang.String dataflowWorkerJar) |
void |
setFlexRSGoal(DataflowPipelineOptions.FlexResourceSchedulingGoal goal) |
void |
setLabels(java.util.Map<java.lang.String,java.lang.String> labels) |
void |
setPipelineUrl(java.lang.String urlString) |
void |
setProject(java.lang.String value) |
void |
setRegion(java.lang.String region) |
void |
setServiceAccount(java.lang.String value) |
void |
setStagingLocation(java.lang.String value) |
void |
setTemplateLocation(java.lang.String value) |
void |
setUpdate(boolean value) |
getApiRootUrl, getDataflowClient, getDataflowEndpoint, getDataflowJobFile, getDumpHeapOnOOM, getNumberOfWorkerHarnessThreads, getOverrideWindmillBinary, getSaveHeapDumpsToGcsPath, getStager, getStagerClass, getTransformNameMapping, getWindmillServiceEndpoint, getWindmillServicePort, setApiRootUrl, setDataflowClient, setDataflowEndpoint, setDataflowJobFile, setDumpHeapOnOOM, setNumberOfWorkerHarnessThreads, setOverrideWindmillBinary, setSaveHeapDumpsToGcsPath, setStager, setStagerClass, setTransformNameMapping, setWindmillServiceEndpoint, setWindmillServicePort
addExperiment, getExperiments, getExperimentValue, hasExperiment, setExperiments
getAutoscalingAlgorithm, getDiskSizeGb, getFilesToStage, getMaxNumWorkers, getMinCpuPlatform, getNetwork, getNumWorkers, getSubnetwork, getUsePublicIps, getWorkerDiskType, getWorkerHarnessContainerImage, getWorkerMachineType, setAutoscalingAlgorithm, setDiskSizeGb, setFilesToStage, setMaxNumWorkers, setMinCpuPlatform, setNetwork, setNumWorkers, setSubnetwork, setUsePublicIps, setWorkerDiskType, setWorkerHarnessContainerImage, setWorkerMachineType
getHTTPWriteTimeout, getInsertBundleParallelism, getMaxStreamingBatchSize, getMaxStreamingRowsToBatch, getNumStreamingKeys, getTempDatasetId, setHTTPWriteTimeout, setInsertBundleParallelism, setMaxStreamingBatchSize, setMaxStreamingRowsToBatch, setNumStreamingKeys, setTempDatasetId
getExecutorService, getGcsEndpoint, getGcsPerformanceMetrics, getGcsUploadBufferSizeBytes, getGcsUtil, getPathValidator, getPathValidatorClass, getUseGrpcForGcs, setExecutorService, setGcsEndpoint, setGcsPerformanceMetrics, setGcsUploadBufferSizeBytes, setGcsUtil, setPathValidator, setPathValidatorClass, setUseGrpcForGcs
getDebuggee, getEnableCloudDebugger, getMaxConditionCost, setDebuggee, setEnableCloudDebugger, setMaxConditionCost
getDefaultWorkerLogLevel, getWorkerLogLevelOverrides, getWorkerSystemErrMessageLevel, getWorkerSystemOutMessageLevel, setDefaultWorkerLogLevel, setWorkerLogLevelOverrides, setWorkerSystemErrMessageLevel, setWorkerSystemOutMessageLevel
getProfilingAgentConfiguration, getSaveProfilesToGcs, setProfilingAgentConfiguration, setSaveProfilesToGcs
getPubsubRootUrl, setPubsubRootUrl
getCredentialFactoryClass, getDataflowKmsKey, getGcpCredential, getGcpTempLocation, getWorkerRegion, getWorkerZone, getZone, isEnableStreamingEngine, setCredentialFactoryClass, setDataflowKmsKey, setEnableStreamingEngine, setGcpCredential, setGcpTempLocation, setWorkerRegion, setWorkerZone, setZone
getGoogleApiTrace, setGoogleApiTrace
@Validation.Required @Default.InstanceFactory(value=GcpOptions.DefaultProjectFactory.class) java.lang.String getProject()
Description copied from interface: GcpOptions
Project id to use when launching jobs.
Specified by: getProject in interface GcpOptions
void setProject(java.lang.String value)
Specified by: setProject in interface GcpOptions
@Default.InstanceFactory(value=DataflowPipelineOptions.StagingLocationFactory.class) java.lang.String getStagingLocation()
Must be a valid Cloud Storage URL, beginning with the prefix "gs://".
If getStagingLocation() is not set, it will default to GcpOptions.getGcpTempLocation(). GcpOptions.getGcpTempLocation() must be a valid GCS path.
void setStagingLocation(java.lang.String value)
boolean isUpdate()
void setUpdate(boolean value)
@Hidden @Experimental java.lang.String getCreateFromSnapshot()
void setCreateFromSnapshot(java.lang.String value)
java.lang.String getTemplateLocation()
void setTemplateLocation(java.lang.String value)
@Hidden @Experimental java.lang.String getServiceAccount()
void setServiceAccount(java.lang.String value)
@Hidden @Experimental @Default.InstanceFactory(value=DataflowPipelineOptions.DefaultGcpRegionFactory.class) java.lang.String getRegion()
void setRegion(java.lang.String region)
java.util.Map<java.lang.String,java.lang.String> getLabels()
void setLabels(java.util.Map<java.lang.String,java.lang.String> labels)
java.lang.String getPipelineUrl()
void setPipelineUrl(java.lang.String urlString)
java.lang.String getDataflowWorkerJar()
void setDataflowWorkerJar(java.lang.String dataflowWorkerJar)
@Default.Enum(value="UNSPECIFIED") DataflowPipelineOptions.FlexResourceSchedulingGoal getFlexRSGoal()
void setFlexRSGoal(DataflowPipelineOptions.FlexResourceSchedulingGoal goal)