{ "pipeline_id": "<slug>", "type": "batch|streaming|hybrid", "orchestration": "airflow|kafka", "layers": { "ingestion": {"sources": [], "method": "full|incremental"}, "transformation": {"tool": "dbt", "models": []}, "quality": {"framework": "great_expectations", "checkpoints": []}, "storage": {"targets": [], "format": "parquet|delta"} }, "schedule": "cron|event-driven" }

{ "pipeline_architecture": { "pipeline_id": "string (slug format)", "type": "batch|streaming|hybrid", "orchestration": { "platform": "airflow|prefect|dagster|kafka", "schedule": "cron expression | event-driven", "parallelism": "integer (max concurrent tasks)" }, "layers": { "ingestion": { "sources": ["array of source configs"], "method": "full|incremental", "connector": "native|fivetran|airbyte|custom" }, "transformation": { "tool": "dbt|spark|custom", "models": ["array of model names"], "materialization": "view|table|incremental" }, "quality": { "framework": "great_expectations|dbt_tests|custom", "checkpoints": ["array of checkpoint configs"], "action_on_failure": "block|warn|quarantine" }, "storage": { "targets": ["array of target configs"], "format": "parquet|delta|iceberg|avro" } }, "monitoring": { "slas": ["array of SLA definitions"], "alerts": ["array of alert configs"], "lineage": "openlineage|datahub|custom" } }, "dag_template": "string (executable code or path to resource)", "quality_checks": "string (Great Expectations suite YAML or dbt test SQL)", "monitoring_config": "string (alert rules, dashboard JSON)", "implementation_guide": "array of step-by-step instructions" }

# Input
pipeline_type: batch
source_systems: [{type: postgres, name: orders_db, tables: [orders, customers]}]
transformation_requirements: [Join orders+customers, Calculate daily revenue]
quality_requirements: [order_id unique, order_total > 0]
orchestration_platform: airflow
target_systems: [{type: snowflake, schema: analytics}]
schedule: "0 2 * * *"

# Output (abbreviated)
pipeline_architecture:
  pipeline_id: ecommerce-orders-elt
  type: batch
  orchestration: {platform: airflow, schedule: "0 2 * * *"}
  layers:
    ingestion:
      sources: [orders_db.orders, orders_db.customers]
      method: incremental
    transformation:
      tool: dbt
      models: [stg_orders, int_order_metrics, fct_daily_revenue]
    quality:
      framework: great_expectations
      checkpoints: [staging_check, marts_check]

name	Data Engineering Pipeline Designer
slug	data-pipeline-designer
description	Design data pipelines with quality checks, orchestration, and governance using modern data stack patterns for robust ELT/ETL workflows.
capabilities	["Design DAGs for batch and streaming pipelines","Embed data quality checks with Great Expectations","Configure Airflow orchestration best practices","Model transformations with dbt patterns","Implement Kafka streaming architectures","Define data lineage and governance controls"]
inputs	[{"pipeline_type":"batch | streaming | hybrid"},{"source_systems":"array of data sources (databases, APIs, files, streams)"},{"transformation_requirements":"business logic, aggregations, joins"},{"quality_requirements":"data validation rules, SLAs, monitoring needs"},{"orchestration_platform":"Airflow | Prefect | Dagster | custom"},{"target_systems":"data warehouse, lake, lakehouse destinations"}]
outputs	[{"pipeline_architecture":"JSON schema with components and flow"},{"dag_template":"orchestration code (Airflow DAG, dbt project)"},{"quality_checks":"Great Expectations suite configuration"},{"monitoring_config":"alerts, SLAs, data lineage tracking"},{"implementation_guide":"step-by-step deployment instructions"}]
keywords	["data-engineering","airflow","dbt","great-expectations","kafka","data-quality","orchestration","ETL","ELT","data-pipeline"]
version	1.0.0
owner	cognitive-toolworks
license	MIT
security	No secrets or PII in examples; use environment variables for credentials
links	["https://airflow.apache.org/docs/","https://docs.getdbt.com/","https://greatexpectations.io/","https://kafka.apache.org/documentation/"]

name	Data Engineering Pipeline Designer
slug	data-pipeline-designer
description	Design data pipelines with quality checks, orchestration, and governance using modern data stack patterns for robust ELT/ETL workflows.
capabilities	["Design DAGs for batch and streaming pipelines","Embed data quality checks with Great Expectations","Configure Airflow orchestration best practices","Model transformations with dbt patterns","Implement Kafka streaming architectures","Define data lineage and governance controls"]
inputs	[{"pipeline_type":"batch | streaming | hybrid"},{"source_systems":"array of data sources (databases, APIs, files, streams)"},{"transformation_requirements":"business logic, aggregations, joins"},{"quality_requirements":"data validation rules, SLAs, monitoring needs"},{"orchestration_platform":"Airflow | Prefect | Dagster | custom"},{"target_systems":"data warehouse, lake, lakehouse destinations"}]
outputs	[{"pipeline_architecture":"JSON schema with components and flow"},{"dag_template":"orchestration code (Airflow DAG, dbt project)"},{"quality_checks":"Great Expectations suite configuration"},{"monitoring_config":"alerts, SLAs, data lineage tracking"},{"implementation_guide":"step-by-step deployment instructions"}]
keywords	["data-engineering","airflow","dbt","great-expectations","kafka","data-quality","orchestration","ETL","ELT","data-pipeline"]
version	1.0.0
owner	cognitive-toolworks
license	MIT
security	No secrets or PII in examples; use environment variables for credentials
links	["https://airflow.apache.org/docs/","https://docs.getdbt.com/","https://greatexpectations.io/","https://kafka.apache.org/documentation/"]

data-engineering-pipeline-designer

Purpose & When-To-Use

Pre-Checks

Procedure

Tier 1 (≤2k tokens): Quick Pipeline Design

Tier 2 (≤6k tokens): Production-Ready Pipeline with Quality Gates

Tier 3 (≤12k tokens): Advanced Patterns and Optimization

Decision Rules

Output Contract

Examples

Quality Gates

Resources

Purpose & When-To-Use

Pre-Checks

Procedure

Tier 1 (≤2k tokens): Quick Pipeline Design

Tier 2 (≤6k tokens): Production-Ready Pipeline with Quality Gates

Tier 3 (≤12k tokens): Advanced Patterns and Optimization

Decision Rules

Output Contract

Examples

Quality Gates

Resources

data-engineering-pipeline-designer

Mehr aus diesem Repository

Mehr aus diesem Repository

Purpose & When-To-Use

Pre-Checks

Procedure

Tier 1 (≤2k tokens): Quick Pipeline Design

Tier 2 (≤6k tokens): Production-Ready Pipeline with Quality Gates

Tier 3 (≤12k tokens): Advanced Patterns and Optimization

Decision Rules

Output Contract

Examples

Quality Gates

Resources

Purpose & When-To-Use

Pre-Checks

Procedure

Tier 1 (≤2k tokens): Quick Pipeline Design

Tier 2 (≤6k tokens): Production-Ready Pipeline with Quality Gates

Tier 3 (≤12k tokens): Advanced Patterns and Optimization

Decision Rules

Output Contract

Examples

Quality Gates

Resources