From 37b5b6d660bfa309abccfe3a408883318fb7cce2 Mon Sep 17 00:00:00 2001 From: Kacper Muda Date: Fri, 17 May 2024 11:51:32 +0200 Subject: [PATCH] fix: empty openlineage dataset name for AthenaExtractor (#39677) Signed-off-by: Kacper Muda --- airflow/providers/amazon/aws/operators/athena.py | 2 +- tests/providers/amazon/aws/operators/test_athena.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/airflow/providers/amazon/aws/operators/athena.py b/airflow/providers/amazon/aws/operators/athena.py index a9e09fb325d43..48b4a8254c083 100644 --- a/airflow/providers/amazon/aws/operators/athena.py +++ b/airflow/providers/amazon/aws/operators/athena.py @@ -266,7 +266,7 @@ def get_openlineage_facets_on_start(self) -> OperatorLineage: if self.output_location: parsed = urlparse(self.output_location) - outputs.append(Dataset(namespace=f"{parsed.scheme}://{parsed.netloc}", name=parsed.path)) + outputs.append(Dataset(namespace=f"{parsed.scheme}://{parsed.netloc}", name=parsed.path or "/")) return OperatorLineage(job_facets=job_facets, run_facets=run_facets, inputs=inputs, outputs=outputs) diff --git a/tests/providers/amazon/aws/operators/test_athena.py b/tests/providers/amazon/aws/operators/test_athena.py index d4ccf521a742d..66fb6b297f993 100644 --- a/tests/providers/amazon/aws/operators/test_athena.py +++ b/tests/providers/amazon/aws/operators/test_athena.py @@ -279,7 +279,7 @@ def mock_get_table_metadata(CatalogName, DatabaseName, TableName): task_id="test_athena_openlineage", query="INSERT INTO TEST_TABLE SELECT CUSTOMER_EMAIL FROM DISCOUNTS", database="TEST_DATABASE", - output_location="s3://test_s3_bucket/", + output_location="s3://test_s3_bucket", client_request_token="eac427d0-1c6d-4dfb-96aa-2835d3ac6595", sleep_time=0, max_polling_attempts=3,