Skip to content

Commit

Permalink
chore(ingest): always use urn creation helpers (datahub-project#11911)
Browse files Browse the repository at this point in the history
  • Loading branch information
hsheth2 authored and sleeperdeep committed Dec 17, 2024
1 parent 50b9293 commit 52e98e4
Show file tree
Hide file tree
Showing 3 changed files with 18 additions and 9 deletions.
10 changes: 7 additions & 3 deletions metadata-ingestion/scripts/modeldocgen.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,11 @@
import click

from datahub.configuration.common import ConfigEnum, PermissiveConfigModel
from datahub.emitter.mce_builder import make_data_platform_urn, make_dataset_urn
from datahub.emitter.mce_builder import (
make_data_platform_urn,
make_dataset_urn,
make_schema_field_urn,
)
from datahub.emitter.mcp import MetadataChangeProposalWrapper
from datahub.emitter.rest_emitter import DatahubRestEmitter
from datahub.ingestion.api.common import PipelineContext, RecordEnvelope
Expand Down Expand Up @@ -442,10 +446,10 @@ def strip_types(field_path: str) -> str:
name=relnship_name,
foreignDataset=foreign_dataset_urn,
foreignFields=[
f"urn:li:schemaField:({foreign_dataset_urn}, urn)"
make_schema_field_urn(foreign_dataset_urn, "urn")
],
sourceFields=[
f"urn:li:schemaField:({source_dataset_urn},{f_field.fieldPath})"
make_schema_field_urn(source_dataset_urn, f_field.fieldPath)
],
)
foreign_keys.append(fkey)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,7 @@
make_data_platform_urn,
make_dataplatform_instance_urn,
make_dataset_urn_with_platform_instance,
make_schema_field_urn,
make_tag_urn,
)
from datahub.emitter.mcp import MetadataChangeProposalWrapper
Expand Down Expand Up @@ -676,7 +677,7 @@ def get_foreign_key_metadata(
)

source_fields = [
f"urn:li:schemaField:({dataset_urn},{f})"
make_schema_field_urn(dataset_urn, f)
for f in fk_dict["constrained_columns"]
]
foreign_dataset = make_dataset_urn_with_platform_instance(
Expand All @@ -686,7 +687,7 @@ def get_foreign_key_metadata(
env=self.config.env,
)
foreign_fields = [
f"urn:li:schemaField:({foreign_dataset},{f})"
make_schema_field_urn(foreign_dataset, f)
for f in fk_dict["referred_columns"]
]

Expand Down
12 changes: 8 additions & 4 deletions metadata-ingestion/tests/unit/test_sql_common.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,7 @@ def test_generate_foreign_key():
"referred_columns": ["test_referred_column"], # type: ignore
}
foreign_key = source.get_foreign_key_metadata(
dataset_urn="test_urn",
dataset_urn="urn:li:dataset:(urn:li:dataPlatform:TEST,test_schema.base_urn,PROD)",
schema="test_schema",
fk_dict=fk_dict,
inspector=mock.Mock(),
Expand All @@ -48,7 +48,9 @@ def test_generate_foreign_key():
assert [
"urn:li:schemaField:(urn:li:dataset:(urn:li:dataPlatform:TEST,test_referred_schema.test_table,PROD),test_referred_column)"
] == foreign_key.foreignFields
assert ["urn:li:schemaField:(test_urn,test_column)"] == foreign_key.sourceFields
assert [
"urn:li:schemaField:(urn:li:dataset:(urn:li:dataPlatform:TEST,test_schema.base_urn,PROD),test_column)"
] == foreign_key.sourceFields


def test_use_source_schema_for_foreign_key_if_not_specified():
Expand All @@ -60,7 +62,7 @@ def test_use_source_schema_for_foreign_key_if_not_specified():
"referred_columns": ["test_referred_column"], # type: ignore
}
foreign_key = source.get_foreign_key_metadata(
dataset_urn="test_urn",
dataset_urn="urn:li:dataset:(urn:li:dataPlatform:TEST,test_schema.base_urn,PROD)",
schema="test_schema",
fk_dict=fk_dict,
inspector=mock.Mock(),
Expand All @@ -70,7 +72,9 @@ def test_use_source_schema_for_foreign_key_if_not_specified():
assert [
"urn:li:schemaField:(urn:li:dataset:(urn:li:dataPlatform:TEST,test_schema.test_table,PROD),test_referred_column)"
] == foreign_key.foreignFields
assert ["urn:li:schemaField:(test_urn,test_column)"] == foreign_key.sourceFields
assert [
"urn:li:schemaField:(urn:li:dataset:(urn:li:dataPlatform:TEST,test_schema.base_urn,PROD),test_column)"
] == foreign_key.sourceFields


PLATFORM_FROM_SQLALCHEMY_URI_TEST_CASES: Dict[str, str] = {
Expand Down

0 comments on commit 52e98e4

Please sign in to comment.