Skip to content

Commit

Permalink
schemadiff/Online DDL internal refactor (#16767)
Browse files Browse the repository at this point in the history
Signed-off-by: Shlomi Noach <2607934+shlomi-noach@users.noreply.github.com>
  • Loading branch information
shlomi-noach authored Sep 15, 2024
1 parent fe28d72 commit fd18ae4
Show file tree
Hide file tree
Showing 5 changed files with 621 additions and 605 deletions.
47 changes: 47 additions & 0 deletions go/vt/schemadiff/names.go
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,9 @@ import (
"fmt"
"regexp"
"strings"

"vitess.io/vitess/go/textutil"
"vitess.io/vitess/go/vt/sqlparser"
)

// constraint name examples:
Expand Down Expand Up @@ -48,3 +51,47 @@ func ExtractConstraintOriginalName(tableName string, constraintName string) stri

return constraintName
}

// newConstraintName generates a new, unique name for a constraint. Our problem is that a MySQL
// constraint's name is unique in the schema (!). And so as we duplicate the original table, we must
// create completely new names for all constraints.
// Moreover, we really want this name to be consistent across all shards. We therefore use a deterministic
// UUIDv5 (SHA) function over the migration UUID, table name, and constraint's _contents_.
// We _also_ include the original constraint name as prefix, as room allows
// for example, if the original constraint name is "check_1",
// we might generate "check_1_cps1okb4uafunfqusi2lp22u3".
// If we then again migrate a table whose constraint name is "check_1_cps1okb4uafunfqusi2lp22u3 " we
// get for example "check_1_19l09s37kbhj4axnzmi10e18k" (hash changes, and we still try to preserve original name)
//
// Furthermore, per bug report https://bugs.mysql.com/bug.php?id=107772, if the user doesn't provide a name for
// their CHECK constraint, then MySQL picks a name in this format <tablename>_chk_<number>.
// Example: sometable_chk_1
// Next, when MySQL is asked to RENAME TABLE and sees a constraint with this format, it attempts to rename
// the constraint with the new table's name. This is problematic for Vitess, because we often rename tables to
// very long names, such as _vt_HOLD_394f9e6dfc3d11eca0390a43f95f28a3_20220706091048.
// As we rename the constraint to e.g. `sometable_chk_1_cps1okb4uafunfqusi2lp22u3`, this makes MySQL want to
// call the new constraint something like _vt_HOLD_394f9e6dfc3d11eca0390a43f95f28a3_20220706091048_chk_1_cps1okb4uafunfqusi2lp22u3,
// which exceeds the 64 character limit for table names. Long story short, we also trim down <tablename> if the constraint seems
// to be auto-generated.
func newConstraintName(tableName string, baseUUID string, constraintDefinition *sqlparser.ConstraintDefinition, hashExists map[string]bool, seed string, oldName string) string {
constraintType := GetConstraintType(constraintDefinition.Details)

constraintIndicator := constraintIndicatorMap[int(constraintType)]
oldName = ExtractConstraintOriginalName(tableName, oldName)
hash := textutil.UUIDv5Base36(baseUUID, tableName, seed)
for i := 1; hashExists[hash]; i++ {
hash = textutil.UUIDv5Base36(baseUUID, tableName, seed, fmt.Sprintf("%d", i))
}
hashExists[hash] = true
suffix := "_" + hash
maxAllowedNameLength := maxConstraintNameLength - len(suffix)
newName := oldName
if newName == "" {
newName = constraintIndicator // start with something that looks consistent with MySQL's naming
}
if len(newName) > maxAllowedNameLength {
newName = newName[0:maxAllowedNameLength]
}
newName = newName + suffix
return newName
}
188 changes: 188 additions & 0 deletions go/vt/schemadiff/onlineddl.go
Original file line number Diff line number Diff line change
Expand Up @@ -17,14 +17,51 @@ limitations under the License.
package schemadiff

import (
"errors"
"fmt"
"math"
"sort"
"strings"

"vitess.io/vitess/go/mysql/capabilities"
"vitess.io/vitess/go/vt/sqlparser"
)

var (
ErrForeignKeyFound = errors.New("Foreign key found")

copyAlgorithm = sqlparser.AlgorithmValue(sqlparser.CopyStr)
)

const (
maxConstraintNameLength = 64
)

type ConstraintType int

const (
UnknownConstraintType ConstraintType = iota
CheckConstraintType
ForeignKeyConstraintType
)

var (
constraintIndicatorMap = map[int]string{
int(CheckConstraintType): "chk",
int(ForeignKeyConstraintType): "fk",
}
)

func GetConstraintType(constraintInfo sqlparser.ConstraintInfo) ConstraintType {
if _, ok := constraintInfo.(*sqlparser.CheckConstraintDefinition); ok {
return CheckConstraintType
}
if _, ok := constraintInfo.(*sqlparser.ForeignKeyDefinition); ok {
return ForeignKeyConstraintType
}
return UnknownConstraintType
}

// ColumnChangeExpandsDataRange sees if target column has any value set/range that is impossible in source column.
func ColumnChangeExpandsDataRange(source *ColumnDefinitionEntity, target *ColumnDefinitionEntity) (bool, string) {
if target.IsNullable() && !source.IsNullable() {
Expand Down Expand Up @@ -588,3 +625,154 @@ func OnlineDDLMigrationTablesAnalysis(

return analysis, nil
}

// ValidateAndEditCreateTableStatement inspects the CreateTable AST and does the following:
// - extra validation (no FKs for now...)
// - generate new and unique names for all constraints (CHECK and FK; yes, why not handle FK names; even as we don't support FKs today, we may in the future)
func ValidateAndEditCreateTableStatement(originalTableName string, baseUUID string, createTable *sqlparser.CreateTable, allowForeignKeys bool) (constraintMap map[string]string, err error) {
constraintMap = map[string]string{}
hashExists := map[string]bool{}

validateWalk := func(node sqlparser.SQLNode) (kontinue bool, err error) {
switch node := node.(type) {
case *sqlparser.ForeignKeyDefinition:
if !allowForeignKeys {
return false, ErrForeignKeyFound
}
case *sqlparser.ConstraintDefinition:
oldName := node.Name.String()
newName := newConstraintName(originalTableName, baseUUID, node, hashExists, sqlparser.CanonicalString(node.Details), oldName)
node.Name = sqlparser.NewIdentifierCI(newName)
constraintMap[oldName] = newName
}
return true, nil
}
if err := sqlparser.Walk(validateWalk, createTable); err != nil {
return constraintMap, err
}
return constraintMap, nil
}

// ValidateAndEditAlterTableStatement inspects the AlterTable statement and:
// - modifies any CONSTRAINT name according to given name mapping
// - explode ADD FULLTEXT KEY into multiple statements
func ValidateAndEditAlterTableStatement(originalTableName string, baseUUID string, capableOf capabilities.CapableOf, alterTable *sqlparser.AlterTable, constraintMap map[string]string) (alters []*sqlparser.AlterTable, err error) {
capableOfInstantDDLXtrabackup, err := capableOf(capabilities.InstantDDLXtrabackupCapability)
if err != nil {
return nil, err
}

hashExists := map[string]bool{}
validateWalk := func(node sqlparser.SQLNode) (kontinue bool, err error) {
switch node := node.(type) {
case *sqlparser.DropKey:
if node.Type == sqlparser.CheckKeyType || node.Type == sqlparser.ForeignKeyType {
// drop a check or a foreign key constraint
mappedName, ok := constraintMap[node.Name.String()]
if !ok {
return false, fmt.Errorf("Found DROP CONSTRAINT: %v, but could not find constraint name in map", sqlparser.CanonicalString(node))
}
node.Name = sqlparser.NewIdentifierCI(mappedName)
}
case *sqlparser.AddConstraintDefinition:
oldName := node.ConstraintDefinition.Name.String()
newName := newConstraintName(originalTableName, baseUUID, node.ConstraintDefinition, hashExists, sqlparser.CanonicalString(node.ConstraintDefinition.Details), oldName)
node.ConstraintDefinition.Name = sqlparser.NewIdentifierCI(newName)
constraintMap[oldName] = newName
}
return true, nil
}
if err := sqlparser.Walk(validateWalk, alterTable); err != nil {
return alters, err
}
alters = append(alters, alterTable)
// Handle ADD FULLTEXT KEY statements
countAddFullTextStatements := 0
redactedOptions := make([]sqlparser.AlterOption, 0, len(alterTable.AlterOptions))
for i := range alterTable.AlterOptions {
opt := alterTable.AlterOptions[i]
switch opt := opt.(type) {
case sqlparser.AlgorithmValue:
if !capableOfInstantDDLXtrabackup {
// we do not pass ALGORITHM. We choose our own ALGORITHM.
continue
}
case *sqlparser.AddIndexDefinition:
if opt.IndexDefinition.Info.Type == sqlparser.IndexTypeFullText {
countAddFullTextStatements++
if countAddFullTextStatements > 1 {
// We've already got one ADD FULLTEXT KEY. We can't have another
// in the same statement
extraAlterTable := &sqlparser.AlterTable{
Table: alterTable.Table,
AlterOptions: []sqlparser.AlterOption{opt},
}
if !capableOfInstantDDLXtrabackup {
extraAlterTable.AlterOptions = append(extraAlterTable.AlterOptions, copyAlgorithm)
}
alters = append(alters, extraAlterTable)
continue
}
}
}
redactedOptions = append(redactedOptions, opt)
}
alterTable.AlterOptions = redactedOptions
if !capableOfInstantDDLXtrabackup {
alterTable.AlterOptions = append(alterTable.AlterOptions, copyAlgorithm)
}
return alters, nil
}

// AddInstantAlgorithm adds or modifies the AlterTable's ALGORITHM to INSTANT
func AddInstantAlgorithm(alterTable *sqlparser.AlterTable) {
instantOpt := sqlparser.AlgorithmValue("INSTANT")
for i, opt := range alterTable.AlterOptions {
if _, ok := opt.(sqlparser.AlgorithmValue); ok {
// replace an existing algorithm
alterTable.AlterOptions[i] = instantOpt
return
}
}
// append an algorithm
alterTable.AlterOptions = append(alterTable.AlterOptions, instantOpt)
}

// DuplicateCreateTable parses the given `CREATE TABLE` statement, and returns:
// - The format CreateTable AST
// - A new CreateTable AST, with the table renamed as `newTableName`, and with constraints renamed deterministically
// - Map of renamed constraints
func DuplicateCreateTable(originalCreateTable *sqlparser.CreateTable, baseUUID string, newTableName string, allowForeignKeys bool) (
newCreateTable *sqlparser.CreateTable,
constraintMap map[string]string,
err error,
) {
newCreateTable = sqlparser.Clone(originalCreateTable)
newCreateTable.SetTable(newCreateTable.GetTable().Qualifier.CompliantName(), newTableName)

// If this table has a self-referencing foreign key constraint, ensure the referenced table gets renamed:
renameSelfFK := func(node sqlparser.SQLNode) (kontinue bool, err error) {
switch node := node.(type) {
case *sqlparser.ConstraintDefinition:
fk, ok := node.Details.(*sqlparser.ForeignKeyDefinition)
if !ok {
return true, nil
}
if referencedTableName := fk.ReferenceDefinition.ReferencedTable.Name.String(); referencedTableName == originalCreateTable.Table.Name.String() {
// This is a self-referencing foreign key
// We need to rename the referenced table as well
fk.ReferenceDefinition.ReferencedTable.Name = sqlparser.NewIdentifierCS(newTableName)
}
}
return true, nil
}
_ = sqlparser.Walk(renameSelfFK, newCreateTable)

// manipulate CreateTable statement: take care of constraints names which have to be
// unique across the schema
constraintMap, err = ValidateAndEditCreateTableStatement(originalCreateTable.Table.Name.String(), baseUUID, newCreateTable, allowForeignKeys)
if err != nil {
return nil, nil, err
}
return newCreateTable, constraintMap, nil
}
Loading

0 comments on commit fd18ae4

Please sign in to comment.