datahub-project
diff --git a/metadata-ingestion/docs/sources/dbt/dbt-cloud_pre.md b/metadata-ingestion/docs/sources/dbt/dbt-cloud_pre.md
Lines changed: 29 additions & 1 deletion
diff --git a/metadata-ingestion/docs/sources/dbt/dbt-cloud_recipe.yml b/metadata-ingestion/docs/sources/dbt/dbt-cloud_recipe.yml
Lines changed: 15 additions & 4 deletions
@@ -5,8 +5,36 @@ This source pulls dbt metadata directly from the dbt Cloud APIs.
 Create a [service account token](https://docs.getdbt.com/docs/dbt-cloud-apis/service-tokens) with the "Metadata Only" permission.
 This is a read-only permission.
 
-You'll need to have a dbt Cloud job set up to run your dbt project, and "Generate docs on run" should be enabled.
+#### Operating Modes
+
+The dbt Cloud source supports two modes of operation:
+
+##### 1. Explicit Mode (Default)
+
+Specify a single dbt Cloud job to ingest metadata from. You'll need to have a dbt Cloud job set up to run your dbt project, and "Generate docs on run" should be enabled.
+
+Note: Because this mode ingests only one job, that job should build all (or most) of the models in your project; otherwise, you may need to ingest multiple jobs.
 
 To get the required IDs, go to the job details page (this is the one with the "Run History" table), and look at the URL.
 It should look something like this: `https://cloud.getdbt.com/next/deploy/107298/projects/175705/jobs/148094`.
 In this example, the account ID is 107298, the project ID is 175705, and the job ID is 148094.
+
+##### 2. Auto-Discovery Mode
+
+Automatically discovers and ingests metadata from all eligible jobs in a dbt Cloud project. This mode:
+
+- Discovers all jobs in the specified project's **production environment only**
+- Includes only jobs that have **"Generate docs on run" enabled** (`generate_docs=True`)
+- Always uses the **latest run** for each job (ignores `run_id` configuration)
+- Supports optional regex-based filtering to include/exclude specific job IDs
+- Ingests metadata from multiple jobs in a single run
+
+**When to use auto-discovery:**
+
+- You have multiple dbt Cloud jobs in a project and want to ingest all of them
+- You want to automatically pick up new jobs without updating configuration
+
+**Requirements:**
+
+- Jobs must be in the production environment
+- Jobs must have "Generate docs on run" enabled
@@ -8,12 +8,23 @@ source:
 
     account_id: "${DBT_ACCOUNT_ID}" # set to your dbt cloud account id
     project_id: "${DBT_PROJECT_ID}" # set to your dbt cloud project id
+
+    # Mode 1: Explicit Mode (specify a single job)
     job_id: "${DBT_JOB_ID}" # set to your dbt cloud job id
-    run_id: # set to your dbt cloud run id. This is optional, and defaults to the latest run
+    run_id: # optional: set to a specific dbt cloud run id. Defaults to the latest run
 
-    target_platform: postgres
+    # Mode 2: Auto-Discovery Mode (automatically discover all eligible jobs)
+    # Uncomment the section below to enable auto-discovery
+    # Note: when auto_discovery is enabled, job_id may be omitted (it is ignored if provided),
+    # and run_id is also ignored (the latest run of each job is always used)
+    # auto_discovery:
+    #   enabled: true
+    #   job_id_pattern: # optional
+    #     allow:
+    #       - ".*"  # regex pattern to include jobs (default: include all)
+    #     # deny:
+    #     #   - "148094"  # optional: regex pattern (matched against job IDs) to exclude specific jobs
 
-    # Options
-    target_platform: "${TARGET_PLATFORM_ID}" # e.g. bigquery/postgres/etc.
+    target_platform: "${TARGET_PLATFORM_ID}" # e.g. bigquery/postgres/snowflake/etc.
 
 # sink configs