|
| 1 | +"""Add Model Deployment related tables |
| 2 | +
|
| 3 | +Revision ID: 0368087c787d |
| 4 | +Revises: 345551145801 |
| 5 | +Create Date: 2025-08-25 00:54:30.288511 |
| 6 | +
|
| 7 | +""" |
| 8 | +import sqlalchemy as sa |
| 9 | +from alembic import op |
| 10 | +from sqlalchemy.dialects import postgresql |
# Alembic revision identifiers: this revision and the one it is applied on top of.
revision = "0368087c787d"
down_revision = "345551145801"
branch_labels = None
depends_on = None
| 16 | + |
| 17 | + |
def upgrade() -> None:
    """Create the model-deployment tables.

    Tables are created parents-first so that every foreign key declared here
    on a table from this revision points at a table created earlier in this
    function: ``blue_green_strategies`` first, then ``model_deployments``,
    then the four tables that reference ``model_deployments``.

    Foreign keys to ``users``, ``images``, ``vfolders`` and ``sessions``
    presumably rely on tables created by earlier revisions -- confirm.
    """
    # The autogenerated script referenced these project column types by their
    # dotted path without importing them (and used a bare ``Text``), which
    # raises NameError as soon as the migration runs. Import them locally so
    # this function is self-contained.
    from ai.backend.manager.models.base import (
        GUID,
        DecimalType,
        ResourceSlotColumn,
        StrEnumType,
        StructuredJSONObjectListColumn,
    )

    # NOTE(review): constructor arguments of the custom types below (e.g.
    # ``StrEnumType(length=64)``) are kept exactly as autogenerate rendered
    # them; confirm each type's ``__init__`` accepts them.

    # NOTE(review): unlike every other table in this revision, the timestamps
    # here are timezone-naive and have no server default -- confirm that this
    # matches the model definition.
    op.create_table(
        "blue_green_strategies",
        sa.Column(
            "id",
            GUID(),
            server_default=sa.text("uuid_generate_v4()"),
            nullable=False,
        ),
        sa.Column("pre_switch_wait_time", sa.Integer(), nullable=False),
        sa.Column("switch_timeout", sa.Integer(), nullable=False),
        sa.Column("is_active", sa.Boolean(), nullable=False),
        sa.Column("created_at", sa.DateTime(), nullable=False),
        sa.Column("updated_at", sa.DateTime(), nullable=False),
        sa.PrimaryKeyConstraint("id", name=op.f("pk_blue_green_strategies")),
    )

    op.create_table(
        "model_deployments",
        sa.Column(
            "id",
            GUID(),
            server_default=sa.text("uuid_generate_v4()"),
            nullable=False,
        ),
        sa.Column("name", sa.String(), nullable=False),
        sa.Column("status", StrEnumType(length=64), nullable=False),
        sa.Column("tags", sa.String(), nullable=False),
        sa.Column("endpoint_url", sa.String(), nullable=True),
        sa.Column("preferred_domain_name", sa.String(), nullable=True),
        sa.Column("open_to_public", sa.Boolean(), nullable=False),
        sa.Column("desired_replica_count", sa.Integer(), nullable=False),
        sa.Column("created_user_id", GUID(), nullable=False),
        # No foreign key is declared for current_revision_id in this revision.
        sa.Column("current_revision_id", GUID(), nullable=False),
        sa.Column("deployment_strategy_type", StrEnumType(length=64), nullable=False),
        sa.Column("deployment_strategy_id", GUID(), nullable=False),
        sa.Column(
            "created_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=True,
        ),
        sa.Column(
            "updated_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=True,
        ),
        sa.ForeignKeyConstraint(
            ["created_user_id"],
            ["users.uuid"],
            name=op.f("fk_model_deployments_created_user_id_users"),
        ),
        sa.ForeignKeyConstraint(
            ["deployment_strategy_id"],
            ["blue_green_strategies.id"],
            name=op.f("fk_model_deployments_deployment_strategy_id_blue_green_strategies"),
        ),
        sa.PrimaryKeyConstraint("id", name=op.f("pk_model_deployments")),
    )
    op.create_index(
        op.f("ix_model_deployments_created_user_id"),
        "model_deployments",
        ["created_user_id"],
        unique=False,
    )
    op.create_index(
        op.f("ix_model_deployments_name"),
        "model_deployments",
        ["name"],
        unique=False,
    )

    op.create_table(
        "model_deployment_auto_scaling_rules",
        sa.Column(
            "id",
            GUID(),
            server_default=sa.text("uuid_generate_v4()"),
            nullable=False,
        ),
        sa.Column("model_deployment_id", GUID(), nullable=False),
        sa.Column("metric_source", sa.String(), nullable=False),
        sa.Column("metric_name", sa.String(), nullable=False),
        sa.Column("min_threshold", DecimalType(), nullable=True),
        sa.Column("max_threshold", DecimalType(), nullable=True),
        sa.Column("step_size", sa.Integer(), nullable=False),
        sa.Column("time_window", sa.Integer(), nullable=False),
        sa.Column("min_replicas", sa.Integer(), nullable=True),
        sa.Column("max_replicas", sa.Integer(), nullable=True),
        sa.Column(
            "created_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=False,
        ),
        # NOTE(review): NOT NULL without a server default, so every insert
        # must supply a value -- confirm this is intended.
        sa.Column("last_triggered_at", sa.DateTime(timezone=True), nullable=False),
        # Exactly one of min_threshold / max_threshold must be set.
        sa.CheckConstraint(
            "(min_threshold IS NOT NULL AND max_threshold IS NULL) OR (min_threshold IS NULL AND max_threshold IS NOT NULL)",
            name=op.f("ck_model_deployment_auto_scaling_rules_check_single_threshold"),
        ),
        sa.ForeignKeyConstraint(
            ["model_deployment_id"],
            ["model_deployments.id"],
            name=op.f(
                "fk_model_deployment_auto_scaling_rules_model_deployment_id_model_deployments"
            ),
        ),
        sa.PrimaryKeyConstraint("id", name=op.f("pk_model_deployment_auto_scaling_rules")),
        sa.UniqueConstraint(
            "model_deployment_id",
            "metric_name",
            name="uq_model_deployment_metric",
        ),
    )

    op.create_table(
        "model_deployment_tokens",
        sa.Column(
            "id",
            GUID(),
            server_default=sa.text("uuid_generate_v4()"),
            nullable=False,
        ),
        sa.Column("token", sa.String(), nullable=False),
        sa.Column("model_deployment_id", GUID(), nullable=False),
        sa.Column(
            "created_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=True,
        ),
        sa.ForeignKeyConstraint(
            ["model_deployment_id"],
            ["model_deployments.id"],
            name=op.f("fk_model_deployment_tokens_model_deployment_id_model_deployments"),
        ),
        sa.PrimaryKeyConstraint("id", name=op.f("pk_model_deployment_tokens")),
    )

    op.create_table(
        "model_revisions",
        sa.Column(
            "id",
            GUID(),
            server_default=sa.text("uuid_generate_v4()"),
            nullable=False,
        ),
        sa.Column("name", sa.String(), nullable=False),
        sa.Column("model_deployment_id", GUID(), nullable=False),
        sa.Column("tags", sa.TEXT(), nullable=False),
        sa.Column("runtime_variant", StrEnumType(length=64), nullable=False),
        sa.Column(
            "inference_runtime_config",
            postgresql.JSONB(astext_type=sa.Text()),
            nullable=False,
        ),
        sa.Column(
            "environment_variables",
            postgresql.JSONB(astext_type=sa.Text()),
            nullable=False,
        ),
        sa.Column("model_vfolder_id", GUID(), nullable=False),
        sa.Column(
            "model_mount_destination",
            sa.String(),
            server_default="/models",
            nullable=False,
        ),
        sa.Column("model_definition_path", sa.String(), nullable=False),
        sa.Column("image_id", GUID(), nullable=False),
        sa.Column(
            "cluster_mode",
            sa.String(),
            server_default="single-node",
            nullable=False,
        ),
        sa.Column("cluster_size", sa.Integer(), server_default="1", nullable=False),
        sa.Column("resource_group", sa.String(), nullable=False),
        # ``Text`` was unqualified in the generated script; only ``sa`` is
        # imported, so it has to be spelled ``sa.Text``.
        sa.Column(
            "resource_slots",
            ResourceSlotColumn(astext_type=sa.Text()),
            nullable=False,
        ),
        sa.Column(
            "resource_opts",
            postgresql.JSONB(astext_type=sa.Text()),
            nullable=False,
        ),
        sa.Column(
            "extra_mount",
            StructuredJSONObjectListColumn(astext_type=sa.Text()),
            server_default="[]",
            nullable=False,
        ),
        sa.Column(
            "created_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=False,
        ),
        sa.ForeignKeyConstraint(
            ["image_id"],
            ["images.id"],
            name=op.f("fk_model_revisions_image_id_images"),
        ),
        sa.ForeignKeyConstraint(
            ["model_deployment_id"],
            ["model_deployments.id"],
            name=op.f("fk_model_revisions_model_deployment_id_model_deployments"),
        ),
        sa.ForeignKeyConstraint(
            ["model_vfolder_id"],
            ["vfolders.id"],
            name=op.f("fk_model_revisions_model_vfolder_id_vfolders"),
        ),
        sa.PrimaryKeyConstraint("id", name=op.f("pk_model_revisions")),
    )

    op.create_table(
        "deployment_session_bindings",
        sa.Column(
            "id",
            GUID(),
            server_default=sa.text("uuid_generate_v4()"),
            nullable=False,
        ),
        sa.Column("deployment_id", GUID(), nullable=False),
        sa.Column("session_id", GUID(), nullable=False),
        sa.Column("weight", DecimalType(), nullable=False),
        sa.Column("readiness_status", StrEnumType(length=64), nullable=False),
        sa.Column(
            "created_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=False,
        ),
        sa.Column(
            "updated_at",
            sa.DateTime(timezone=True),
            server_default=sa.text("now()"),
            nullable=False,
        ),
        sa.ForeignKeyConstraint(
            ["deployment_id"],
            ["model_deployments.id"],
            name=op.f("fk_deployment_session_bindings_deployment_id_model_deployments"),
        ),
        sa.ForeignKeyConstraint(
            ["session_id"],
            ["sessions.id"],
            name=op.f("fk_deployment_session_bindings_session_id_sessions"),
        ),
        sa.PrimaryKeyConstraint("id", name=op.f("pk_deployment_session_bindings")),
    )
| 113 | + |
| 114 | + |
def downgrade() -> None:
    """Drop everything created by ``upgrade()``, in the reverse order.

    The tables that reference ``model_deployments`` are dropped first, then
    the two indexes on ``model_deployments``, then ``model_deployments``
    itself, and finally ``blue_green_strategies``, which it references.
    """
    dependent_tables = (
        "deployment_session_bindings",
        "model_revisions",
        "model_deployment_tokens",
        "model_deployment_auto_scaling_rules",
    )
    for table_name in dependent_tables:
        op.drop_table(table_name)

    deployment_indexes = (
        "ix_model_deployments_name",
        "ix_model_deployments_created_user_id",
    )
    for index_name in deployment_indexes:
        op.drop_index(op.f(index_name), table_name="model_deployments")

    for table_name in ("model_deployments", "blue_green_strategies"):
        op.drop_table(table_name)
0 commit comments