Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions docs/how/updating-datahub.md
Original file line number Diff line number Diff line change
Expand Up @@ -54,6 +54,7 @@ This file documents any backwards-incompatible changes in DataHub and assists pe
- #14717: The Tableau ingestion source now enables `extract_lineage_from_unsupported_custom_sql_queries` by default. This improves the quality of lineage extracted by using DataHub's SQL parser in cases where the Tableau Catalog API fails to return lineage for Custom SQL queries.
- #14824: DataHub now supports CDC (Change Data Capture) mode for generating MetadataChangeLogs with guaranteed ordering based on database transaction commits. CDC mode is optional and disabled by default. When enabled via `CDC_MCL_PROCESSING_ENABLED=true`, MCLs are generated from Debezium-captured database changes rather than directly from GMS. This provides stronger ordering guarantees and decoupled processing. Requires MySQL 5.7+ or PostgreSQL 10+ with replication enabled. See [CDC Configuration Guide](configure-cdc.md) for setup instructions.
- Added multi-client search engine shim for Elasticsearch and OpenSearch support. This enables DataHub to work with ES 7.17 (with API compatibility mode for ES 8.x servers), ES 8.x, and OpenSearch 2.x through a unified interface. The shim includes auto-detection of search engine types and backward compatibility with existing RestHighLevelClient usage. See [elasticsearch-search-client-shim.md](./elasticsearch-search-client-shim.md) for configuration details.
- Added a new `db2` ingestion source for IBM Db2 databases. The source is currently in testing support status.

## 1.2.0

Expand Down
13 changes: 13 additions & 0 deletions metadata-ingestion/docs/sources/db2/db2_recipe.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
source:
  type: db2
  config:
    # Coordinates
    host_port: localhost:50000
    database: dbname

    # Credentials
    username: db2inst1
    password: password

sink:
  # sink configs
3 changes: 3 additions & 0 deletions metadata-ingestion/setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -462,6 +462,7 @@
"datahub-lineage-file": set(),
"datahub-business-glossary": set(),
"delta-lake": {*data_lake_profiling, *delta_lake},
"db2": {"ibm_db_sa"} | sql_common,
"dbt": {"requests"} | dbt_common | aws_common,
"dbt-cloud": {"requests"} | dbt_common,
"dremio": {"requests"} | sql_common,
Expand Down Expand Up @@ -772,6 +773,7 @@
"athena",
"circuit-breaker",
"clickhouse",
"db2",
"delta-lake",
"druid",
"excel",
Expand Down Expand Up @@ -814,6 +816,7 @@
"cockroachdb = datahub.ingestion.source.sql.cockroachdb:CockroachDBSource",
"delta-lake = datahub.ingestion.source.delta_lake:DeltaLakeSource",
"s3 = datahub.ingestion.source.s3:S3Source",
"db2 = datahub.ingestion.source.sql.db2:Db2Source",
"dbt = datahub.ingestion.source.dbt.dbt_core:DBTCoreSource",
"dbt-cloud = datahub.ingestion.source.dbt.dbt_cloud:DBTCloudSource",
"dremio = datahub.ingestion.source.dremio.dremio_source:DremioSource",
Expand Down
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
{
"generated_at": "2025-08-28T07:13:19.226648+00:00",
"generated_at": "2025-10-08T19:45:31.582840+00:00",
"generated_by": "metadata-ingestion/scripts/capability_summary.py",
"plugin_details": {
"abs": {
Expand Down Expand Up @@ -542,6 +542,87 @@
"platform_name": "File Based Lineage",
"support_status": "CERTIFIED"
},
"db2": {
"capabilities": [
{
"capability": "CONTAINERS",
"description": "Enabled by default",
"subtype_modifier": [
"Database",
"Schema"
],
"supported": true
},
{
"capability": "CLASSIFICATION",
"description": "Optionally enabled via `classification.enabled`",
"subtype_modifier": null,
"supported": true
},
{
"capability": "LINEAGE_FINE",
"description": "Enabled by default to get lineage for views via `include_view_column_lineage`",
"subtype_modifier": [
"View"
],
"supported": true
},
{
"capability": "DATA_PROFILING",
"description": "Optionally enabled via configuration",
"subtype_modifier": null,
"supported": true
},
{
"capability": "DESCRIPTIONS",
"description": "Enabled by default",
"subtype_modifier": null,
"supported": true
},
{
"capability": "DELETION_DETECTION",
"description": "Enabled by default via stateful ingestion",
"subtype_modifier": null,
"supported": true
},
{
"capability": "DOMAINS",
"description": "Supported via the `domain` config field",
"subtype_modifier": null,
"supported": true
},
{
"capability": "PLATFORM_INSTANCE",
"description": "Enabled by default",
"subtype_modifier": null,
"supported": true
},
{
"capability": "SCHEMA_METADATA",
"description": "Enabled by default",
"subtype_modifier": null,
"supported": true
},
{
"capability": "LINEAGE_COARSE",
"description": "Enabled by default to get lineage for views via `include_view_lineage`",
"subtype_modifier": [
"View"
],
"supported": true
},
{
"capability": "TEST_CONNECTION",
"description": "Enabled by default",
"subtype_modifier": null,
"supported": true
}
],
"classname": "datahub.ingestion.source.sql.db2.Db2Source",
"platform_id": "db2",
"platform_name": "IBM Db2",
"support_status": "TESTING"
},
"dbt": {
"capabilities": [
{
Expand Down
Loading
Loading