[RFC] Only build code locations with changes #590
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Dagster Cloud Hybrid Deployment | |
on: | |
push: # For full deployment | |
branches: | |
- "main" | |
- "master" | |
pull_request: # For branch deployments | |
types: [opened, synchronize, reopened, closed] | |
concurrency: | |
# Cancel in-progress deploys to the same branch | |
group: ${{ github.ref }} | |
cancel-in-progress: true | |
env: | |
DAGSTER_CLOUD_ORGANIZATION: "hooli" | |
DAGSTER_CLOUD_API_TOKEN: ${{ secrets.DAGSTER_CLOUD_API_TOKEN }} | |
DAGSTER_PROJECT_DIR: "." | |
DAGSTER_CLOUD_YAML_PATH: "dagster_cloud.yaml" | |
# The IMAGE_REGISTRY should match the registry: in dagster_cloud.yaml | |
IMAGE_REGISTRY: "764506304434.dkr.ecr.us-west-2.amazonaws.com/hooli-data-science-prod" | |
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} | |
jobs: | |
dagster-cloud-deploy: | |
runs-on: ubuntu-22.04 | |
steps: | |
- name: Pre-run checks | |
id: prerun | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
- name: Checkout | |
uses: actions/checkout@v4 | |
if: steps.prerun.outputs.result != 'skip' | |
with: | |
ref: ${{ github.head_ref }} | |
- name: Get changed files | |
id: changed-files | |
uses: tj-actions/changed-files@v45 | |
with: | |
files_yaml: | | |
hooli_data_eng: | |
- dbt_project/** | |
- hooli_data_eng/** | |
- pyproject.toml | |
- Dockerfile | |
hooli_basics: | |
- hooli_basics/** | |
hooli_batch_enrichment: | |
- hooli_batch_enrichment/** | |
hooli_snowflake_insights: | |
- hooli_snowflake_insights/** | |
hooli-data-ingest: | |
- hooli-data-ingest/** | |
hooli-bi: | |
- hooli-bi/** | |
- name: Generate docker image tag | |
id: generate-image-tag | |
if: steps.prerun.outputs.result != 'skip' | |
run: | | |
echo "IMAGE_TAG=$GITHUB_SHA-$GITHUB_RUN_ID-$GITHUB_RUN_ATTEMPT" >> $GITHUB_ENV && echo $IMAGE_TAG | |
- name: Get Code locations that changed | |
id: extract-changed-dirs | |
run: | | |
changed_files="${{ steps.changed-files.outputs.hooli_data_eng_all_changed_files }} ${{ steps.changed-files.outputs.hooli_basics_all_changed_files }} ${{ steps.changed-files.outputs.hooli_batch_enrichment_all_changed_files }} ${{ steps.changed-files.outputs.hooli_snowflake_insights_all_changed_files }} ${{ steps.changed-files.outputs.hooli-data-ingest_all_changed_files }} ${{ steps.changed-files.outputs.hooli-bi_all_changed_files }}" | |
filtered_dirs=$(echo $changed_files | tr ' ' '\n' | xargs -n1 dirname | sort | uniq) | |
echo $changed_files | |
echo $filtered_dirs | |
LOCATIONS="" | |
LOCATIONS_WITH_IMAGE="" | |
if [ "${{ steps.changed-files.outputs.hooli_data_eng_any_changed}}" == "true" ]; then | |
LOCATIONS="$LOCATIONS --location-name data-eng-pipeline" | |
LOCATIONS_WITH_IMAGE="$LOCATIONS_WITH_IMAGE --location-name data-eng-pipeline --image-tag=$IMAGE_TAG-data-eng-pipeline" | |
fi | |
if [ "${{ steps.changed-files.outputs.hooli_basics_any_changed}}" == "true" ]; then | |
LOCATIONS="$LOCATIONS --location-name basics" | |
LOCATIONS_WITH_IMAGE="$LOCATIONS_WITH_IMAGE --location-name basics --image-tag=$IMAGE_TAG-basics" | |
fi | |
if [ "${{ steps.changed-files.outputs.hooli_batch_enrichment_any_changed}}" == "true" ]; then | |
LOCATIONS="$LOCATIONS --location-name batch_enrichment" | |
LOCATIONS_WITH_IMAGE="$LOCATIONS_WITH_IMAGE --location-name batch_enrichment --image-tag=$IMAGE_TAG-batch-enrichment" | |
fi | |
if [ "${{ steps.changed-files.outputs.hooli_snowflake_insights_any_changed}}" == "true" ]; then | |
LOCATIONS="$LOCATIONS --location-name snowflake_insights" | |
LOCATIONS_WITH_IMAGE="$LOCATIONS_WITH_IMAGE --location-name snowflake_insights --image-tag=$IMAGE_TAG-snowflake-insights" | |
fi | |
if [ "${{ steps.changed-files.outputs.hooli-data-ingest_any_changed}}" == "true" ]; then | |
LOCATIONS="$LOCATIONS --location-name hooli_data_ingest" | |
LOCATIONS_WITH_IMAGE="$LOCATIONS_WITH_IMAGE --location-name hooli_data_ingest --image-tag=$IMAGE_TAG-hooli-data-ingest" | |
fi | |
if [ "${{ steps.changed-files.outputs.hooli-bi_any_changed}}" == "true" ]; then | |
LOCATIONS="$LOCATIONS --location-name hooli_bi" | |
LOCATIONS_WITH_IMAGE="$LOCATIONS_WITH_IMAGE --location-name hooli_bi --image-tag=$IMAGE_TAG-hooli-bi" | |
fi | |
echo $LOCATIONS | |
echo $LOCATIONS_WITH_IMAGE | |
echo "LOCATIONS=$LOCATIONS" >> $GITHUB_ENV | |
echo "LOCATIONS_WITH_IMAGE=$LOCATIONS_WITH_IMAGE" >> $GITHUB_ENV | |
- name: Install the latest version of uv | |
uses: astral-sh/setup-uv@v3 | |
with: | |
enable-cache: true | |
- name: Validate configuration | |
id: ci-validate | |
if: steps.prerun.outputs.result != 'skip' | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
command: "ci check --project-dir ${{ env.DAGSTER_PROJECT_DIR }} --dagster-cloud-yaml-path ${{ env.DAGSTER_CLOUD_YAML_PATH }}" | |
- name: Initialize build session | |
id: ci-init | |
if: steps.prerun.outputs.result != 'skip' | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
project_dir: ${{ env.DAGSTER_PROJECT_DIR }} | |
dagster_cloud_yaml_path: ${{ env.DAGSTER_CLOUD_YAML_PATH }} | |
deployment: 'data-eng-prod' | |
- name: Set up Docker Buildx | |
uses: docker/setup-buildx-action@v3 | |
- name: Configure AWS credentials | |
uses: aws-actions/configure-aws-credentials@v4 | |
if: steps.prerun.outputs.result != 'skip' | |
with: | |
aws-access-key-id: ${{ secrets.AWS_ACCESS_KEY_ID }} | |
aws-secret-access-key: ${{ secrets.AWS_SECRET_ACCESS_KEY }} | |
aws-region: us-west-2 | |
- name: Login to ECR | |
if: ${{ steps.prerun.outputs.result != 'skip' }} | |
uses: aws-actions/amazon-ecr-login@v2 | |
with: | |
mask-password: 'true' | |
- name: Set Prod Deployment Environment Variable for Push | |
if: steps.prerun.outputs.result != 'skip' && github.event_name == 'push' | |
run: echo "DAGSTER_CLOUD_DEPLOYMENT_NAME=data-eng-prod" >> $GITHUB_ENV | |
- name: Prepare dbt project | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli_data_eng_any_changed == 'true' | |
run: | | |
uv venv | |
source .venv/bin/activate | |
uv pip install dagster-dbt dagster-cloud dbt-core dbt-duckdb dbt-snowflake --upgrade; | |
dagster-dbt project prepare-and-package --file hooli_data_eng/project.py | |
dagster-cloud ci dagster-dbt project manage-state --file hooli_data_eng/project.py --source-deployment data-eng-prod | |
- name: Build and upload Docker image for data-eng-pipeline | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli_data_eng_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: . | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:${{ env.IMAGE_TAG }}-data-eng-pipeline | |
# Build 'basics' code location | |
- name: Build and upload Docker image for basics | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli_basics_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: ./hooli_basics | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:${{ env.IMAGE_TAG }}-basics | |
# Build 'batch enrichment' code location | |
- name: Build and upload Docker image for batch enrichment | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli_batch_enrichment_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: ./hooli_batch_enrichment | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:${{ env.IMAGE_TAG }}-batch-enrichment | |
# Build 'snowflake_insights' code location | |
- name: Build and upload Docker image for snowflake insights | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli_snowflake_insights_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: ./hooli_snowflake_insights | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:${{ env.IMAGE_TAG }}-snowflake-insights | |
# Build 'hooli_data_ingest' code location | |
- name: Build and upload Docker image for hooli_data_ingest | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli-data-ingest_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: ./hooli-data-ingest | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:${{ env.IMAGE_TAG }}-hooli-data-ingest | |
# Build 'hooli_bi' code location | |
- name: Build and upload Docker image for hooli_bi | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli-bi_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: ./hooli-bi | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:${{ env.IMAGE_TAG }}-hooli-bi | |
# Build pipes example container | |
- name: Build and upload Docker image for pipes example | |
if: steps.prerun.outputs.result != 'skip' && steps.changed-files.outputs.hooli_data_eng_any_changed == 'true' | |
uses: docker/build-push-action@v5 | |
with: | |
context: ./hooli_data_eng/utils/example_container | |
push: true | |
tags: ${{ env.IMAGE_REGISTRY }}:latest-pipes-example | |
#set build output | |
- name: Set build output for Dagster Cloud | |
id: ci-set-build-output | |
if: steps.prerun.outputs.result != 'skip' | |
run: | | |
while [[ $LOCATIONS_WITH_IMAGE ]]; do | |
# Extract the first --location-name and --image-tag pair | |
LOCATION_NAME=$(echo $LOCATIONS_WITH_IMAGE | awk '{print $2}') | |
IMAGE_TAG=$(echo $LOCATIONS_WITH_IMAGE | awk '{print $4}') | |
# Run the ci deploy command | |
echo "Running ci deploy for $LOCATION_NAME with image tag $IMAGE_TAG" | |
dagster-cloud ci deploy --location-name $LOCATION_NAME --image-tag $IMAGE_TAG | |
# Remove the processed pair from LOCATIONS_WITH_IMAGE | |
LOCATIONS_WITH_IMAGE=$(echo $LOCATIONS_WITH_IMAGE | sed 's/--location-name [^ ]* --image-tag=[^ ]*//') | |
done | |
# uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
# with: | |
# command: "ci set-build-output $LOCATIONS_WITH_IMAGE" | |
#Deploy | |
- name: Deploy to Dagster Cloud | |
id: ci-deploy | |
if: steps.prerun.outputs.result != 'skip' | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
command: "ci deploy $LOCATIONS" | |
# Get branch deployment as input to job trigger below | |
- name: Get branch deployment | |
id: get-branch-deployment | |
if: steps.prerun.outputs.result != 'skip' && github.event_name == 'pull_request' | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
organization_id: 'hooli' | |
# Trigger dbt slim CI job | |
- name: Trigger dbt slim CI | |
if: steps.prerun.outputs.result != 'skip' && github.event_name == 'pull_request' && steps.changed-files.outputs.hooli_bi_any_changed == 'true' | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
location_name: data-eng-pipeline | |
deployment: ${{ steps.get-branch-deployment.outputs.deployment }} | |
job_name: dbt_slim_ci_job | |
organization_id: hooli | |
# Summary and comment updates - note these always() run | |
- name: Update PR comment for branch deployments | |
id: ci-notify | |
if: steps.prerun.outputs.result != 'skip' && always() | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
command: "ci notify --project-dir=${{ env.DAGSTER_PROJECT_DIR }}" | |
- name: Generate summary | |
id: ci-summary | |
if: steps.prerun.outputs.result != 'skip' && always() | |
uses: dagster-io/dagster-cloud-action/actions/utils/[email protected] | |
with: | |
command: "ci status --output-format=markdown >> $GITHUB_STEP_SUMMARY" |