# Export to file for next processing step in pipeline
# Copyright 2020 The Kubeflow Authors
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Component definition: display name, description, declared inputs/outputs,
# and the container invocation that consumes them.
name: Bigquery - Query
description: |
  A Kubeflow Pipeline component to submit a query to Google Cloud Bigquery and
  store the results to a csv file.
metadata:
  labels:
    # Quoted so the label value stays the string 'true' rather than a boolean.
    add-pod-env: 'true'
inputs:
  - name: query
    description: 'The query used by Bigquery service to fetch the results.'
    type: String
  - name: project_id
    description: 'The project to execute the query job.'
    type: GCPProjectID
  - name: job_config
    description: >-
      The full config spec for the query job.See
      [QueryJobConfig](https://googleapis.github.io/google-cloud-python/latest/bigquery/generated/google.cloud.bigquery.job.QueryJobConfig.html#google.cloud.bigquery.job.QueryJobConfig)
      for details.
    # Empty string by default, i.e. no extra job configuration is supplied.
    default: ''
    type: Dict
  - name: output_filename
    description: 'The output file name'
    default: 'bq_results.csv'
    type: String
outputs:
  - name: MLPipeline UI metadata
    type: UI metadata
  - name: table
    description: 'The path to the result from BigQuery'
    type: CSV
implementation:
  container:
    image: gcr.io/ml-pipeline/ml-pipeline-gcp:1.7.0-rc.3
    # Command-line tokens passed to the container, one flag/value pair per row.
    # Each {inputValue: ...} / {outputPath: ...} mapping refers by name to an
    # input or output declared above.
    args: [
      --ui_metadata_path, {outputPath: MLPipeline UI metadata},
      kfp_component.google.bigquery, query,
      --query, {inputValue: query},
      --project_id, {inputValue: project_id},
      --output_path, {outputPath: table},
      --output_filename, {inputValue: output_filename},
      --job_config, {inputValue: job_config},
    ]
    env:
      # Must stay quoted: an unquoted leading '{' would be parsed as a YAML
      # flow mapping. NOTE(review): presumably a workflow-engine template
      # placeholder substituted with the pod name at run time - confirm.
      KFP_POD_NAME: "{{pod.name}}"