Commit eae22ce

Adds 'Trino' provider (with lower memory footprint for tests) (#15187)
While checking the test status of various CI tests we came to the conclusion that the Presto integration took a lot of memory (~1GB) and was the main source of failures during integration tests, especially with MySQL 8. The attempt to fine-tune the memory used led to the discovery that Presto DB stopped publishing their Docker image (prestosql/presto), apparently in the aftermath of splitting off Trino from Presto. The split-off was already discussed in #14281 and it was planned to add support for Trino, which is the more community-driven fork of Presto: Presto remained under Facebook governance, while Trino is an effort continued by the original creators. You can read more about it in the announcement: https://trino.io/blog/2020/12/27/announcing-trino.html. While Presto continues its way under The Linux Foundation, Trino lives its own life and keeps on maintaining all artifacts and libraries (including the image). That allowed us to update our tests and decrease the memory footprint by around 400MB.

This commit:

* adds the new Trino provider
* removes the `presto` integration and replaces it with `trino`
* builds the `trino` integration image with 400MB lower memory requirements and publishes it as `apache/airflow:trino-*`
* moves the integration tests from Presto to Trino

Fixes: #14281
1 parent bc5ced3 commit eae22ce
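Only a subset of the 49 changed files appears below; the provider's own hook and operator modules are not shown. As a rough illustration of what the new provider enables, here is a minimal sketch of a DAG task querying Trino. It assumes the hook is exposed as `airflow.providers.trino.hooks.trino.TrinoHook` (mirroring the existing Presto hook) and that a default Trino connection is configured in Airflow; neither of these is shown in this excerpt.

# Minimal sketch, not part of this commit's diff excerpt.
# Assumptions: the new provider exposes TrinoHook at
# airflow.providers.trino.hooks.trino (mirroring the Presto provider),
# and a default Trino connection is configured in Airflow.
from airflow import models
from airflow.operators.python import PythonOperator
from airflow.providers.trino.hooks.trino import TrinoHook
from airflow.utils.dates import days_ago


def count_customers():
    hook = TrinoHook()  # uses the provider's default connection id
    # get_first() comes from the common DbApiHook base class
    row = hook.get_first("SELECT count(*) FROM tpch.sf1.customer")
    print(f"customer rows: {row[0]}")


with models.DAG(
    dag_id="example_trino_count",
    schedule_interval=None,
    start_date=days_ago(1),
    tags=["example"],
) as dag:
    PythonOperator(task_id="count_customers", python_callable=count_customers)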

49 files changed (+1901 -96 lines)

BREEZE.rst

Lines changed: 1 addition & 1 deletion
@@ -2444,7 +2444,7 @@ This is the current syntax for `./breeze <./breeze>`_:
           start all integrations. Selected integrations are not saved for future execution.
           One of:

-                 cassandra kerberos mongo openldap pinot presto rabbitmq redis statsd all
+                 cassandra kerberos mongo openldap pinot rabbitmq redis statsd trino all

   --init-script INIT_SCRIPT_FILE
           Initialization script name - Sourced from files/airflow-breeze-config. Default value

CONTRIBUTING.rst

Lines changed: 4 additions & 4 deletions
@@ -594,7 +594,7 @@ github_enterprise, google, google_auth, grpc, hashicorp, hdfs, hive, http, imap,
 jira, kerberos, kubernetes, ldap, microsoft.azure, microsoft.mssql, microsoft.winrm, mongo, mssql,
 mysql, neo4j, odbc, openfaas, opsgenie, oracle, pagerduty, papermill, password, pinot, plexus,
 postgres, presto, qds, qubole, rabbitmq, redis, s3, salesforce, samba, segment, sendgrid, sentry,
-sftp, singularity, slack, snowflake, spark, sqlite, ssh, statsd, tableau, telegram, vertica,
+sftp, singularity, slack, snowflake, spark, sqlite, ssh, statsd, tableau, telegram, trino, vertica,
 virtualenv, webhdfs, winrm, yandex, zendesk

 .. END EXTRAS HERE

@@ -661,11 +661,11 @@ apache.hive          amazon,microsoft.mssql,mysql,presto,samba,vertica
 apache.livy          http
 dingding             http
 discord              http
-google               amazon,apache.beam,apache.cassandra,cncf.kubernetes,facebook,microsoft.azure,microsoft.mssql,mysql,oracle,postgres,presto,salesforce,sftp,ssh
+google               amazon,apache.beam,apache.cassandra,cncf.kubernetes,facebook,microsoft.azure,microsoft.mssql,mysql,oracle,postgres,presto,salesforce,sftp,ssh,trino
 hashicorp            google
 microsoft.azure      google,oracle
 microsoft.mssql      odbc
-mysql                amazon,presto,vertica
+mysql                amazon,presto,trino,vertica
 opsgenie             http
 postgres             amazon
 salesforce           tableau

@@ -756,7 +756,7 @@ providers.
   not only "green path"

 * Integration tests where 'local' integration with a component is possible (for example tests with
-  MySQL/Postgres DB/Presto/Kerberos all have integration tests which run with real, dockerised components
+  MySQL/Postgres DB/Trino/Kerberos all have integration tests which run with real, dockerized components

 * System Tests which provide end-to-end testing, usually testing together several operators, sensors,
   transfers connecting to a real external system

IMAGES.rst

Lines changed: 2 additions & 2 deletions
@@ -116,7 +116,7 @@ parameter to Breeze:

 .. code-block:: bash

-     ./breeze build-image --python 3.7 --additional-extras=presto \
+     ./breeze build-image --python 3.7 --additional-extras=trino \
          --production-image --install-airflow-version=2.0.0


@@ -163,7 +163,7 @@ You can also skip installing airflow and install it from locally provided files

 .. code-block:: bash

-     ./breeze build-image --python 3.7 --additional-extras=presto \
+     ./breeze build-image --python 3.7 --additional-extras=trino \
          --production-image --disable-pypi-when-building --install-from-local-files-when-building

 In this case you airflow and all packages (.whl files) should be placed in ``docker-context-files`` folder.

INSTALL

Lines changed: 1 addition & 1 deletion
@@ -106,7 +106,7 @@ github_enterprise, google, google_auth, grpc, hashicorp, hdfs, hive, http, imap,
 jira, kerberos, kubernetes, ldap, microsoft.azure, microsoft.mssql, microsoft.winrm, mongo, mssql,
 mysql, neo4j, odbc, openfaas, opsgenie, oracle, pagerduty, papermill, password, pinot, plexus,
 postgres, presto, qds, qubole, rabbitmq, redis, s3, salesforce, samba, segment, sendgrid, sentry,
-sftp, singularity, slack, snowflake, spark, sqlite, ssh, statsd, tableau, telegram, vertica,
+sftp, singularity, slack, snowflake, spark, sqlite, ssh, statsd, tableau, telegram, trino, vertica,
 virtualenv, webhdfs, winrm, yandex, zendesk

 # END EXTRAS HERE

TESTING.rst

Lines changed: 2 additions & 2 deletions
@@ -281,12 +281,12 @@ The following integrations are available:
     - Integration required for OpenLDAP hooks
   * - pinot
     - Integration required for Apache Pinot hooks
-  * - presto
-    - Integration required for Presto hooks
   * - rabbitmq
     - Integration required for Celery executor tests
   * - redis
     - Integration required for Celery executor tests
+  * - trino
+    - Integration required for Trino hooks

 To start the ``mongo`` integration only, enter:

airflow/providers/dependencies.json

Lines changed: 3 additions & 1 deletion
@@ -50,7 +50,8 @@
     "presto",
     "salesforce",
     "sftp",
-    "ssh"
+    "ssh",
+    "trino"
   ],
   "hashicorp": [
     "google"

@@ -65,6 +66,7 @@
   "mysql": [
     "amazon",
     "presto",
+    "trino",
     "vertica"
   ],
   "opsgenie": [
New file (example DAG using TrinoToGCSOperator)

Lines changed: 150 additions & 0 deletions
@@ -0,0 +1,150 @@
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
"""
Example DAG using TrinoToGCSOperator.
"""
import os
import re

from airflow import models
from airflow.providers.google.cloud.operators.bigquery import (
    BigQueryCreateEmptyDatasetOperator,
    BigQueryCreateExternalTableOperator,
    BigQueryDeleteDatasetOperator,
    BigQueryExecuteQueryOperator,
)
from airflow.providers.google.cloud.transfers.trino_to_gcs import TrinoToGCSOperator
from airflow.utils.dates import days_ago

GCP_PROJECT_ID = os.environ.get("GCP_PROJECT_ID", 'example-project')
GCS_BUCKET = os.environ.get("GCP_TRINO_TO_GCS_BUCKET_NAME", "test-trino-to-gcs-bucket")
DATASET_NAME = os.environ.get("GCP_TRINO_TO_GCS_DATASET_NAME", "test_trino_to_gcs_dataset")

SOURCE_MULTIPLE_TYPES = "memory.default.test_multiple_types"
SOURCE_CUSTOMER_TABLE = "tpch.sf1.customer"


def safe_name(s: str) -> str:
    """
    Remove invalid characters for filename
    """
    return re.sub("[^0-9a-zA-Z_]+", "_", s)


with models.DAG(
    dag_id="example_trino_to_gcs",
    schedule_interval=None,  # Override to match your needs
    start_date=days_ago(1),
    tags=["example"],
) as dag:

    create_dataset = BigQueryCreateEmptyDatasetOperator(task_id="create-dataset", dataset_id=DATASET_NAME)

    delete_dataset = BigQueryDeleteDatasetOperator(
        task_id="delete_dataset", dataset_id=DATASET_NAME, delete_contents=True
    )

    # [START howto_operator_trino_to_gcs_basic]
    trino_to_gcs_basic = TrinoToGCSOperator(
        task_id="trino_to_gcs_basic",
        sql=f"select * from {SOURCE_MULTIPLE_TYPES}",
        bucket=GCS_BUCKET,
        filename=f"{safe_name(SOURCE_MULTIPLE_TYPES)}.{{}}.json",
    )
    # [END howto_operator_trino_to_gcs_basic]

    # [START howto_operator_trino_to_gcs_multiple_types]
    trino_to_gcs_multiple_types = TrinoToGCSOperator(
        task_id="trino_to_gcs_multiple_types",
        sql=f"select * from {SOURCE_MULTIPLE_TYPES}",
        bucket=GCS_BUCKET,
        filename=f"{safe_name(SOURCE_MULTIPLE_TYPES)}.{{}}.json",
        schema_filename=f"{safe_name(SOURCE_MULTIPLE_TYPES)}-schema.json",
        gzip=False,
    )
    # [END howto_operator_trino_to_gcs_multiple_types]

    # [START howto_operator_create_external_table_multiple_types]
    create_external_table_multiple_types = BigQueryCreateExternalTableOperator(
        task_id="create_external_table_multiple_types",
        bucket=GCS_BUCKET,
        source_objects=[f"{safe_name(SOURCE_MULTIPLE_TYPES)}.*.json"],
        source_format="NEWLINE_DELIMITED_JSON",
        destination_project_dataset_table=f"{DATASET_NAME}.{safe_name(SOURCE_MULTIPLE_TYPES)}",
        schema_object=f"{safe_name(SOURCE_MULTIPLE_TYPES)}-schema.json",
    )
    # [END howto_operator_create_external_table_multiple_types]

    read_data_from_gcs_multiple_types = BigQueryExecuteQueryOperator(
        task_id="read_data_from_gcs_multiple_types",
        sql=f"SELECT COUNT(*) FROM `{GCP_PROJECT_ID}.{DATASET_NAME}.{safe_name(SOURCE_MULTIPLE_TYPES)}`",
        use_legacy_sql=False,
    )

    # [START howto_operator_trino_to_gcs_many_chunks]
    trino_to_gcs_many_chunks = TrinoToGCSOperator(
        task_id="trino_to_gcs_many_chunks",
        sql=f"select * from {SOURCE_CUSTOMER_TABLE}",
        bucket=GCS_BUCKET,
        filename=f"{safe_name(SOURCE_CUSTOMER_TABLE)}.{{}}.json",
        schema_filename=f"{safe_name(SOURCE_CUSTOMER_TABLE)}-schema.json",
        approx_max_file_size_bytes=10_000_000,
        gzip=False,
    )
    # [END howto_operator_trino_to_gcs_many_chunks]

    create_external_table_many_chunks = BigQueryCreateExternalTableOperator(
        task_id="create_external_table_many_chunks",
        bucket=GCS_BUCKET,
        source_objects=[f"{safe_name(SOURCE_CUSTOMER_TABLE)}.*.json"],
        source_format="NEWLINE_DELIMITED_JSON",
        destination_project_dataset_table=f"{DATASET_NAME}.{safe_name(SOURCE_CUSTOMER_TABLE)}",
        schema_object=f"{safe_name(SOURCE_CUSTOMER_TABLE)}-schema.json",
    )

    # [START howto_operator_read_data_from_gcs_many_chunks]
    read_data_from_gcs_many_chunks = BigQueryExecuteQueryOperator(
        task_id="read_data_from_gcs_many_chunks",
        sql=f"SELECT COUNT(*) FROM `{GCP_PROJECT_ID}.{DATASET_NAME}.{safe_name(SOURCE_CUSTOMER_TABLE)}`",
        use_legacy_sql=False,
    )
    # [END howto_operator_read_data_from_gcs_many_chunks]

    # [START howto_operator_trino_to_gcs_csv]
    trino_to_gcs_csv = TrinoToGCSOperator(
        task_id="trino_to_gcs_csv",
        sql=f"select * from {SOURCE_MULTIPLE_TYPES}",
        bucket=GCS_BUCKET,
        filename=f"{safe_name(SOURCE_MULTIPLE_TYPES)}.{{}}.csv",
        schema_filename=f"{safe_name(SOURCE_MULTIPLE_TYPES)}-schema.json",
        export_format="csv",
    )
    # [END howto_operator_trino_to_gcs_csv]

    create_dataset >> trino_to_gcs_basic
    create_dataset >> trino_to_gcs_multiple_types
    create_dataset >> trino_to_gcs_many_chunks
    create_dataset >> trino_to_gcs_csv

    trino_to_gcs_multiple_types >> create_external_table_multiple_types >> read_data_from_gcs_multiple_types
    trino_to_gcs_many_chunks >> create_external_table_many_chunks >> read_data_from_gcs_many_chunks

    trino_to_gcs_basic >> delete_dataset
    trino_to_gcs_csv >> delete_dataset
    read_data_from_gcs_multiple_types >> delete_dataset
    read_data_from_gcs_many_chunks >> delete_dataset
