diff --git a/gms/impl/src/main/resources/DataPlatformInfo.json b/gms/impl/src/main/resources/DataPlatformInfo.json index d41e5b04afdfe9..8369572a7d6b72 100644 --- a/gms/impl/src/main/resources/DataPlatformInfo.json +++ b/gms/impl/src/main/resources/DataPlatformInfo.json @@ -67,9 +67,9 @@ "type": "OLAP_DATASTORE", "logoUrl": "https://raw.githubusercontent.com/linkedin/datahub/master/datahub-web-react/src/images/kustologo.png" }, - "urn:li:dataPlatform:mongo": { + "urn:li:dataPlatform:mongodb": { "datasetNameDelimiter": ".", - "name": "mongo", + "name": "mongodb", "displayName": "MongoDB", "type": "KEY_VALUE_STORE", "logoUrl": "https://raw.githubusercontent.com/linkedin/datahub/master/datahub-web-react/src/images/mongodblogo.png" diff --git a/gms/impl/src/test/java/com/linkedin/metadata/resources/dataplatform/utils/DataPlatformsUtilTest.java b/gms/impl/src/test/java/com/linkedin/metadata/resources/dataplatform/utils/DataPlatformsUtilTest.java index df8571bf960bf1..f7bf68998fad1b 100644 --- a/gms/impl/src/test/java/com/linkedin/metadata/resources/dataplatform/utils/DataPlatformsUtilTest.java +++ b/gms/impl/src/test/java/com/linkedin/metadata/resources/dataplatform/utils/DataPlatformsUtilTest.java @@ -30,7 +30,7 @@ public void testGetPlatformType() { assertPlatformType("hdfs", PlatformType.FILE_SYSTEM); assertPlatformType("hive", PlatformType.FILE_SYSTEM); assertPlatformType("kafka", PlatformType.MESSAGE_BROKER); - assertPlatformType("mongo", PlatformType.KEY_VALUE_STORE); + assertPlatformType("mongodb", PlatformType.KEY_VALUE_STORE); assertPlatformType("mysql", PlatformType.RELATIONAL_DB); assertPlatformType("oracle", PlatformType.RELATIONAL_DB); assertPlatformType("pinot", PlatformType.OLAP_DATASTORE); @@ -66,7 +66,7 @@ public void testGetPlatformDelimiter() { assertEquals(DataPlatformsUtil.getPlatformDelimiter("hdfs").get(), "/"); assertEquals(DataPlatformsUtil.getPlatformDelimiter("hive").get(), "."); assertEquals(DataPlatformsUtil.getPlatformDelimiter("kafka").get(), "."); - assertEquals(DataPlatformsUtil.getPlatformDelimiter("mongo").get(), "."); + assertEquals(DataPlatformsUtil.getPlatformDelimiter("mongodb").get(), "."); assertEquals(DataPlatformsUtil.getPlatformDelimiter("mysql").get(), "."); assertEquals(DataPlatformsUtil.getPlatformDelimiter("oracle").get(), "."); assertEquals(DataPlatformsUtil.getPlatformDelimiter("pinot").get(), "."); diff --git a/metadata-ingestion/examples/mce_files/bootstrap_mce.json b/metadata-ingestion/examples/mce_files/bootstrap_mce.json index b7a4ee0932f062..a98a61cdf7bf9d 100644 --- a/metadata-ingestion/examples/mce_files/bootstrap_mce.json +++ b/metadata-ingestion/examples/mce_files/bootstrap_mce.json @@ -1626,12 +1626,12 @@ "auditHeader": null, "proposedSnapshot": { "com.linkedin.pegasus2avro.metadata.snapshot.DataPlatformSnapshot": { - "urn": "urn:li:dataPlatform:mongo", + "urn": "urn:li:dataPlatform:mongodb", "aspects": [ { "com.linkedin.pegasus2avro.dataplatform.DataPlatformInfo": { "datasetNameDelimiter": ".", - "name": "mongo", + "name": "mongodb", "displayName": "MongoDB", "type": "KEY_VALUE_STORE", "logoUrl": "https://raw.githubusercontent.com/linkedin/datahub/master/datahub-web-react/src/images/mongodblogo.png" diff --git a/metadata-ingestion/examples/mce_files/data_platforms.json b/metadata-ingestion/examples/mce_files/data_platforms.json index 605cbb159b42cd..d80668a7f75348 100644 --- a/metadata-ingestion/examples/mce_files/data_platforms.json +++ b/metadata-ingestion/examples/mce_files/data_platforms.json @@ -201,12 +201,12 @@ "auditHeader": null, "proposedSnapshot": { "com.linkedin.pegasus2avro.metadata.snapshot.DataPlatformSnapshot": { - "urn": "urn:li:dataPlatform:mongo", + "urn": "urn:li:dataPlatform:mongodb", "aspects": [ { "com.linkedin.pegasus2avro.dataplatform.DataPlatformInfo": { "datasetNameDelimiter": ".", - "name": "mongo", + "name": "mongodb", "displayName": "MongoDB", "type": "KEY_VALUE_STORE", "logoUrl": "https://raw.githubusercontent.com/linkedin/datahub/master/datahub-web-react/src/images/mongodblogo.png" diff --git a/metadata-ingestion/examples/recipes/mongodb_to_datahub.yml b/metadata-ingestion/examples/recipes/mongodb_to_datahub.yml new file mode 100644 index 00000000000000..931524093284ac --- /dev/null +++ b/metadata-ingestion/examples/recipes/mongodb_to_datahub.yml @@ -0,0 +1,20 @@ +source: + type: "mongodb" + config: + # For advanced configurations, see the MongoDB docs. + # https://pymongo.readthedocs.io/en/stable/examples/authentication.html + connect_uri: "mongodb://localhost:57017" + username: mongoadmin + password: examplepass + env: "PROD" # Optional, default is "PROD" + authMechanism: "DEFAULT" + options: {} + database_pattern: {} + collection_pattern: {} + enableSchemaInference: True + schemaSamplingSize: 1000 + # database_pattern/collection_pattern are similar to schema_pattern/table_pattern from above +sink: + type: "datahub-rest" + config: + server: "http://localhost:8080" diff --git a/metadata-ingestion/src/datahub/ingestion/source/superset.py b/metadata-ingestion/src/datahub/ingestion/source/superset.py index be09328a0a9589..e93702f62dd6da 100644 --- a/metadata-ingestion/src/datahub/ingestion/source/superset.py +++ b/metadata-ingestion/src/datahub/ingestion/source/superset.py @@ -52,7 +52,7 @@ def get_platform_from_sqlalchemy_uri(sqlalchemy_uri: str) -> str: if sqlalchemy_uri.startswith("mysql"): return "mysql" if sqlalchemy_uri.startswith("mongodb"): - return "mongo" + return "mongodb" if sqlalchemy_uri.startswith("hive"): return "hive" return "external" diff --git a/metadata-utils/src/main/java/com/linkedin/metadata/utils/elasticsearch/ElasticsearchUtil.java b/metadata-utils/src/main/java/com/linkedin/metadata/utils/elasticsearch/ElasticsearchUtil.java index 457c904a5378b2..b33330a8a1b9f3 100644 --- a/metadata-utils/src/main/java/com/linkedin/metadata/utils/elasticsearch/ElasticsearchUtil.java +++ b/metadata-utils/src/main/java/com/linkedin/metadata/utils/elasticsearch/ElasticsearchUtil.java @@ -25,7 +25,7 @@ public enum AccessCountType { .put("hive", '.') .put("kafka", '.') .put("kafka-lc", '.') - .put("mongo", '.') + .put("mongodb", '.') .put("mysql", '.') .put("oracle", '.') .put("pinot", '.')