您可以使用适用于 Python 的 Dataflow API 客户端库中的模板启动方法(`templates().launch`)来执行此操作,如下所示:
# Launch a Dataflow job from a template stored in Cloud Storage, using the
# Dataflow v1b3 API through the Google API Python client.
#
# PROJECT_ID, LOCATION, SOME_NAME and PATH_TO_TEMPLATE are placeholders that
# this snippet does not define; supply real values before running. The
# "{{my-cloud-storage-bucket}}" fragments are likewise placeholders for a
# bucket name.
import googleapiclient.discovery
from oauth2client.client import GoogleCredentials

project = PROJECT_ID
# NOTE(review): `location` is assigned but not passed to launch() below.
# The launch endpoint appears to accept an optional `location` argument --
# confirm against the API reference before wiring it in.
location = LOCATION

# Application Default Credentials are resolved from the environment.
credentials = GoogleCredentials.get_application_default()
dataflow = googleapiclient.discovery.build(
    'dataflow', 'v1b3', credentials=credentials)

result = dataflow.projects().templates().launch(
    projectId=project,
    body={
        "environment": {
            "zone": "us-central1-f",
            "tempLocation": "gs://{{my-cloud-storage-bucket}}/tmp",
        },
        # Each parameter value is itself a JSON document passed as a string,
        # so the inner double quotes must be part of the string. Single-quoted
        # Python literals keep them intact without backslash escapes.
        "parameters": {
            "inputLocations": '{"location1":"gs://{{my-cloud-storage-bucket}}/my-folder*"}',
            "outputLocations": '{"location1":"gs://{{my-cloud-storage-bucket}}/my-output/output.csv"}',
        },
        "jobName": SOME_NAME,
    },
    gcsPath=PATH_TO_TEMPLATE,
).execute()


