Skip to content

Commit

Permalink
fix(ingest/bigquery): Fix tags urn/name ingestion for BigQuery (#11691)
Browse files (browse the repository at this point in the history)
  • Loading branch information
skrydal authored Oct 22, 2024
1 parent 7ba77a9 commit b7958c4
Show file tree
Hide file tree
Showing 3 changed files with 100 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -310,7 +310,7 @@ def gen_dataset_containers(
logger.warning(
f"Failed to generate platform resource for label {k}:{v}: {e}"
)
- tags_joined.append(tag_urn.urn())
+ tags_joined.append(tag_urn.name)

database_container_key = self.gen_project_id_key(database=project_id)

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -112,6 +112,26 @@
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "container",
"entityUrn": "urn:li:container:8df46c5e3ded05a3122b0015822c0ef0",
"changeType": "UPSERT",
"aspectName": "globalTags",
"aspect": {
"json": {
"tags": [
{
"tag": "urn:li:tag:priority:medium:test"
}
]
}
},
"systemMetadata": {
"lastObserved": 1643871600000,
"runId": "bigquery-2022_02_03-07_00_00",
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "container",
"entityUrn": "urn:li:container:8df46c5e3ded05a3122b0015822c0ef0",
Expand Down Expand Up @@ -257,6 +277,64 @@
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "platformResource",
"entityUrn": "urn:li:platformResource:7fbbf79fb726422dc2434222a8e30630",
"changeType": "UPSERT",
"aspectName": "platformResourceInfo",
"aspect": {
"json": {
"resourceType": "BigQueryLabelInfo",
"primaryKey": "priority/medium:test",
"secondaryKeys": [
"urn:li:tag:priority:medium:test"
],
"value": {
"blob": "{\"datahub_urn\": \"urn:li:tag:priority:medium:test\", \"managed_by_datahub\": false, \"key\": \"priority\", \"value\": \"medium:test\"}",
"contentType": "JSON",
"schemaType": "JSON",
"schemaRef": "BigQueryLabelInfo"
}
}
},
"systemMetadata": {
"lastObserved": 1643871600000,
"runId": "bigquery-2022_02_03-07_00_00-2j2qqv",
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "platformResource",
"entityUrn": "urn:li:platformResource:7fbbf79fb726422dc2434222a8e30630",
"changeType": "UPSERT",
"aspectName": "dataPlatformInstance",
"aspect": {
"json": {
"platform": "urn:li:dataPlatform:bigquery"
}
},
"systemMetadata": {
"lastObserved": 1643871600000,
"runId": "bigquery-2022_02_03-07_00_00-2j2qqv",
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "platformResource",
"entityUrn": "urn:li:platformResource:7fbbf79fb726422dc2434222a8e30630",
"changeType": "UPSERT",
"aspectName": "status",
"aspect": {
"json": {
"removed": false
}
},
"systemMetadata": {
"lastObserved": 1643871600000,
"runId": "bigquery-2022_02_03-07_00_00-2j2qqv",
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "platformResource",
"entityUrn": "urn:li:platformResource:99b34051bd90d28d922b0e107277a916",
Expand Down Expand Up @@ -1241,6 +1319,22 @@
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "tag",
"entityUrn": "urn:li:tag:priority:medium:test",
"changeType": "UPSERT",
"aspectName": "tagKey",
"aspect": {
"json": {
"name": "priority:medium:test"
}
},
"systemMetadata": {
"lastObserved": 1643871600000,
"runId": "bigquery-2022_02_03-07_00_00",
"lastRunId": "no-run-id-provided"
}
},
{
"entityType": "tag",
"entityUrn": "urn:li:tag:purchase",
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -70,6 +70,7 @@ def recipe(mcp_output_path: str, source_config_override: dict = {}) -> dict:
"include_table_lineage": True,
"include_data_platform_instance": True,
"capture_table_label_as_tag": True,
"capture_dataset_label_as_tag": True,
"classification": ClassificationConfig(
enabled=True,
classifiers=[
Expand Down Expand Up @@ -141,7 +142,10 @@ def side_effect(*args: Any) -> Optional[PlatformResource]:

get_platform_resource.side_effect = side_effect
get_datasets_for_project_id.return_value = [
- BigqueryDataset(name=dataset_name, location="US")
+ # BigqueryDataset(name=dataset_name, location="US")
+ BigqueryDataset(
+ name=dataset_name, location="US", labels={"priority": "medium:test"}
+ )
]

table_list_item = TableListItem(
Expand Down

0 comments on commit b7958c4

Please sign in to comment.