-
Notifications
You must be signed in to change notification settings - Fork 14.4k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
AIP-65: Add DAG versioning support (#42913)
* AIP-65: Add DAG versioning support

This commit introduces versioning for DAGs.

Changes:
- Introduced DagVersion model to handle versioning of DAGs.
- Added version_name field to DAG for use in tracking the DagVersion by users.
- Added support for version retrieval in the get_dag_source API endpoint.
- Modified DAG execution logic to reference dag_version_id instead of the dag_hash to ensure DAG runs are linked to specific versions.

Fix tests
revert REST API changes

* fixup! AIP-65: Add DAG versioning support
* fixup! fixup! AIP-65: Add DAG versioning support
* fix migration
* fix test
* more test fixes
* update query count
* fix static checks
* Fix query and add created_at to dag_version table
* improve code
* Change to using UUID for primary keys
* DagCode.bulk_write_code is no longer used
* fixup! Change to using UUID for primary keys
* fix tests
* fixup! fix tests
* use uuid for version_name
* fixup! use uuid for version_name
* use row lock when writing dag version
* use row lock when writing dag version
* fixup! use row lock when writing dag version
* deactivating dag should not remove serialized dags
* save version_name as string not uuid
* Make dag_version_id unique
* fixup! Make dag_version_id unique
* Fix tests
* Use uuid7
* fix test
* fixup! fix test
* use binary=False for uuid field to fix sqlite issue
* apply suggestions from code review
* Remove unnecessary version_name on dagmodel
* Fix sqlalchemy 2 warning
* Fix conflicts
* Apply suggestions from code review

Co-authored-by: Jed Cunningham <66968678+jedcunningham@users.noreply.github.com>

* fixup! Apply suggestions from code review
* fixup! fixup! Apply suggestions from code review
* add test for dagversion model and make version_name, number and dag_id unique
* Remove commented test as serdag can no longer disappear
* Add SQLAlchemy-utils to requirements
* mark test_dag_version.py as db_test
* make version_name nullable
* Apply suggestions from code review
* fixup! Apply suggestions from code review
* remove file_updater
* Use dag_version for creating dagruns instead of dag_version_id
* fix conflicts
* use if TYPE_CHECKING
* Add docstrings to methods
* Move getting latest serdags to SerializedDagModel
- Loading branch information
1 parent
da50242
commit 1116f28
Showing
46 changed files
with
3,049 additions
and
2,366 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
151 changes: 151 additions & 0 deletions
151
airflow/migrations/versions/0047_3_0_0_add_dag_versioning.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,151 @@ | ||
# | ||
# Licensed to the Apache Software Foundation (ASF) under one | ||
# or more contributor license agreements. See the NOTICE file | ||
# distributed with this work for additional information | ||
# regarding copyright ownership. The ASF licenses this file | ||
# to you under the Apache License, Version 2.0 (the | ||
# "License"); you may not use this file except in compliance | ||
# with the License. You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, | ||
# software distributed under the License is distributed on an | ||
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY | ||
# KIND, either express or implied. See the License for the | ||
# specific language governing permissions and limitations | ||
# under the License. | ||
|
||
""" | ||
add dag versioning. | ||
Revision ID: 2b47dc6bc8df | ||
Revises: d03e4a635aa3 | ||
Create Date: 2024-10-09 05:44:04.670984 | ||
""" | ||
|
||
from __future__ import annotations | ||
|
||
import sqlalchemy as sa | ||
from alembic import op | ||
from sqlalchemy_utils import UUIDType | ||
|
||
from airflow.migrations.db_types import StringID | ||
from airflow.models.base import naming_convention | ||
from airflow.utils import timezone | ||
from airflow.utils.sqlalchemy import UtcDateTime | ||
|
||
# Revision identifiers, used by Alembic.
# `revision` names this migration; `down_revision` names the migration it revises.
revision = "2b47dc6bc8df"
down_revision = "d03e4a635aa3"
branch_labels = None
depends_on = None
# Airflow version label for this migration (matches the 3_0_0 in the file name).
airflow_version = "3.0.0"
|
||
|
||
def upgrade():
    """
    Apply add dag versioning.

    Creates the ``dag_version`` table and links ``dag_code``, ``serialized_dag``,
    ``task_instance`` and ``dag_run`` to it through a ``dag_version_id`` foreign key
    declared with ``ON DELETE CASCADE``. ``task_instance_history`` receives a plain
    ``dag_version_id`` column without a foreign key.

    ``dag_code`` and ``serialized_dag`` have their primary key replaced by a new UUID
    ``id`` column. ``serialized_dag`` additionally loses ``fileloc``, ``fileloc_hash``
    and the ``idx_fileloc_hash`` index, and ``dag_run`` loses ``dag_hash``.
    """
    op.create_table(
        "dag_version",
        sa.Column("id", UUIDType(binary=False), nullable=False),
        sa.Column("version_number", sa.Integer(), nullable=False),
        sa.Column("version_name", StringID()),
        sa.Column("dag_id", StringID(), nullable=False),
        # NOTE(review): `default=` is a Python-side default; presumably it does not
        # produce a server default in the emitted DDL -- confirm.
        sa.Column("created_at", UtcDateTime(), nullable=False, default=timezone.utcnow),
        sa.ForeignKeyConstraint(
            ("dag_id",), ["dag.dag_id"], name=op.f("dag_version_dag_id_fkey"), ondelete="CASCADE"
        ),
        sa.PrimaryKeyConstraint("id", name=op.f("dag_version_pkey")),
        # NOTE(review): the constraint name mentions "v_name", but only dag_id and
        # version_number are covered. The name is also not wrapped in op.f() like the others.
        sa.UniqueConstraint("dag_id", "version_number", name="dag_id_v_name_v_number_unique_constraint"),
    )

    # dag_code: swap the primary key to a new UUID `id` and attach each row to one dag_version.
    with op.batch_alter_table("dag_code", recreate="always", naming_convention=naming_convention) as batch_op:
        batch_op.drop_constraint("dag_code_pkey", type_="primary")
        batch_op.add_column(
            sa.Column("id", UUIDType(binary=False), primary_key=True), insert_before="fileloc_hash"
        )
        batch_op.create_primary_key("dag_code_pkey", ["id"])
        # NOTE(review): `id` and `dag_version_id` are added without any default and
        # dag_version_id is NOT NULL; presumably dag_code is expected to be empty when
        # this runs -- confirm, otherwise existing rows may violate the constraint.
        batch_op.add_column(sa.Column("dag_version_id", UUIDType(binary=False), nullable=False))
        batch_op.create_foreign_key(
            batch_op.f("dag_code_dag_version_id_fkey"),
            "dag_version",
            ["dag_version_id"],
            ["id"],
            ondelete="CASCADE",
        )
        # At most one dag_code row per dag_version.
        batch_op.create_unique_constraint("dag_code_dag_version_id_uq", ["dag_version_id"])

    # serialized_dag: same primary-key swap, plus removal of the fileloc columns and their index.
    with op.batch_alter_table(
        "serialized_dag", recreate="always", naming_convention=naming_convention
    ) as batch_op:
        batch_op.drop_constraint("serialized_dag_pkey", type_="primary")
        batch_op.add_column(sa.Column("id", UUIDType(binary=False), primary_key=True))
        batch_op.drop_index("idx_fileloc_hash")
        batch_op.drop_column("fileloc_hash")
        batch_op.drop_column("fileloc")
        batch_op.create_primary_key("serialized_dag_pkey", ["id"])
        # NOTE(review): same NOT NULL / no-default concern as for dag_code above -- confirm
        # that serialized_dag is empty (or gets repopulated) around this migration.
        batch_op.add_column(sa.Column("dag_version_id", UUIDType(binary=False), nullable=False))
        batch_op.create_foreign_key(
            batch_op.f("serialized_dag_dag_version_id_fkey"),
            "dag_version",
            ["dag_version_id"],
            ["id"],
            ondelete="CASCADE",
        )
        # At most one serialized_dag row per dag_version.
        batch_op.create_unique_constraint("serialized_dag_dag_version_id_uq", ["dag_version_id"])

    # task_instance: nullable link to dag_version.
    with op.batch_alter_table("task_instance", schema=None) as batch_op:
        batch_op.add_column(sa.Column("dag_version_id", UUIDType(binary=False)))
        batch_op.create_foreign_key(
            batch_op.f("task_instance_dag_version_id_fkey"),
            "dag_version",
            ["dag_version_id"],
            ["id"],
            ondelete="CASCADE",
        )

    # task_instance_history: column only, no foreign key is created here.
    with op.batch_alter_table("task_instance_history", schema=None) as batch_op:
        batch_op.add_column(sa.Column("dag_version_id", UUIDType(binary=False)))

    # dag_run: nullable link to dag_version; the dag_hash column is dropped.
    with op.batch_alter_table("dag_run", schema=None) as batch_op:
        batch_op.add_column(sa.Column("dag_version_id", UUIDType(binary=False)))
        batch_op.create_foreign_key(
            batch_op.f("dag_run_dag_version_id_fkey"),
            "dag_version",
            ["dag_version_id"],
            ["id"],
            ondelete="CASCADE",
        )
        batch_op.drop_column("dag_hash")
|
||
|
||
def downgrade():
    """
    Unapply add dag versioning.

    Removes every ``dag_version_id`` column (and its foreign key where one was created),
    restores the primary keys of ``dag_code`` (``fileloc_hash``) and ``serialized_dag``
    (``dag_id``), re-adds ``serialized_dag.fileloc`` / ``fileloc_hash`` with the
    ``idx_fileloc_hash`` index and ``dag_run.dag_hash``, then drops ``dag_version``.

    Only the schema is restored: nothing here repopulates the re-added columns.
    """
    # task_instance_history has no foreign key on dag_version_id, so only the column goes.
    with op.batch_alter_table("task_instance_history", schema=None) as batch_op:
        batch_op.drop_column("dag_version_id")

    with op.batch_alter_table("task_instance", schema=None) as batch_op:
        batch_op.drop_constraint(batch_op.f("task_instance_dag_version_id_fkey"), type_="foreignkey")
        batch_op.drop_column("dag_version_id")

    # dag_code: remove the UUID `id` and the version link, then key the table on fileloc_hash again.
    with op.batch_alter_table("dag_code", schema=None) as batch_op:
        batch_op.drop_column("id")
        batch_op.drop_constraint(batch_op.f("dag_code_dag_version_id_fkey"), type_="foreignkey")
        batch_op.drop_column("dag_version_id")
        batch_op.create_primary_key("dag_code_pkey", ["fileloc_hash"])

    # serialized_dag: remove the UUID `id`, bring back the fileloc columns and index,
    # and key the table on dag_id again.
    with op.batch_alter_table("serialized_dag", schema=None, naming_convention=naming_convention) as batch_op:
        batch_op.drop_column("id")
        # NOTE(review): both columns are re-added as NOT NULL with no default; presumably
        # serialized_dag must be empty for this to succeed -- confirm.
        batch_op.add_column(sa.Column("fileloc", sa.String(length=2000), autoincrement=False, nullable=False))
        batch_op.add_column(sa.Column("fileloc_hash", sa.BIGINT(), autoincrement=False, nullable=False))
        batch_op.create_index("idx_fileloc_hash", ["fileloc_hash"], unique=False)
        batch_op.create_primary_key("serialized_dag_pkey", ["dag_id"])
        batch_op.drop_constraint(batch_op.f("serialized_dag_dag_version_id_fkey"), type_="foreignkey")
        batch_op.drop_column("dag_version_id")

    # dag_run: re-add dag_hash as a nullable column and remove the version link.
    with op.batch_alter_table("dag_run", schema=None) as batch_op:
        batch_op.add_column(sa.Column("dag_hash", sa.String(length=32), autoincrement=False, nullable=True))
        batch_op.drop_constraint(batch_op.f("dag_run_dag_version_id_fkey"), type_="foreignkey")
        batch_op.drop_column("dag_version_id")

    # Dropped last, after every foreign key pointing at dag_version has been removed above.
    op.drop_table("dag_version")
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.