Skip to content

Commit

Permalink
feat: skip index creation during loading MySQL snapshot (#278)
Browse files Browse the repository at this point in the history
  • Loading branch information
fanyang01 authored Dec 10, 2024
1 parent 73f3a8e commit 0d691f2
Show file tree
Hide file tree
Showing 7 changed files with 62 additions and 10 deletions.
10 changes: 10 additions & 0 deletions backend/loaddata.go
Original file line number Diff line number Diff line change
Expand Up @@ -117,6 +117,16 @@ func (db *DuckBuilder) executeLoadData(ctx *sql.Context, insert *plan.InsertInto
b.Grow(256)

keyless := sql.IsKeyless(dst.Schema())
// TODO(fan): This is an ugly hack for MySQL Shell's utilities to work properly.
if !keyless {
if t, ok := dst.(*catalog.Table); ok {
// Replicated tables do not have physical primary keys.
// Their logical primary keys are fake and should not be used in INSERT INTO statements.
// https://github.com/apecloud/myduckserver/issues/272
keyless = t.ExtraTableInfo().Replicated
}
}

b.WriteString("INSERT")
if load.IsIgnore && !keyless {
b.WriteString(" OR IGNORE")
Expand Down
27 changes: 22 additions & 5 deletions catalog/database.go
Original file line number Diff line number Diff line change
Expand Up @@ -170,11 +170,11 @@ func (d *Database) createAllTable(ctx *sql.Context, name string, schema sql.Prim
primaryKeys = append(primaryKeys, schema.Schema[pkord].Name)
}

withoutIndex := isIndexCreationDisabled(ctx)

// https://github.com/apecloud/myduckserver/issues/272
if !(mycontext.IsReplicationQuery(ctx) && configuration.IsReplicationWithoutIndex()) {
if len(primaryKeys) > 0 {
b.WriteString(fmt.Sprintf(", PRIMARY KEY (%s)", strings.Join(primaryKeys, ", ")))
}
if len(primaryKeys) > 0 && !withoutIndex {
b.WriteString(fmt.Sprintf(", PRIMARY KEY (%s)", strings.Join(primaryKeys, ", ")))
}

b.WriteString(")")
Expand All @@ -183,7 +183,7 @@ func (d *Database) createAllTable(ctx *sql.Context, name string, schema sql.Prim
b.WriteString(fmt.Sprintf(
"; COMMENT ON TABLE %s IS '%s'",
fullTableName,
NewCommentWithMeta(comment, ExtraTableInfo{schema.PkOrdinals}).Encode(),
NewCommentWithMeta(comment, ExtraTableInfo{schema.PkOrdinals, withoutIndex}).Encode(),
))

// Add column comments
Expand All @@ -205,6 +205,23 @@ func (d *Database) createAllTable(ctx *sql.Context, name string, schema sql.Prim
return nil
}

func isIndexCreationDisabled(ctx *sql.Context) bool {
if !configuration.IsReplicationWithoutIndex() {
return false
}
if mycontext.IsReplicationQuery(ctx) {
return true
}
_, vv, ok := sql.SystemVariables.GetGlobal("replica_is_loading_snapshot")
if !ok {
return false
}
if b, ok := vv.(int8); ok {
return b != 0
}
return false
}

// CreateTable implements sql.TableCreator.
func (d *Database) CreateTable(ctx *sql.Context, name string, schema sql.PrimaryKeySchema, collation sql.CollationID, comment string) error {
d.mu.Lock()
Expand Down
4 changes: 2 additions & 2 deletions catalog/table.go
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,6 @@ import (

"github.com/apecloud/myduckserver/adapter"
"github.com/apecloud/myduckserver/configuration"
"github.com/apecloud/myduckserver/mycontext"
"github.com/dolthub/go-mysql-server/sql"
"github.com/dolthub/go-mysql-server/sql/expression"
"github.com/marcboeker/go-duckdb"
Expand All @@ -25,6 +24,7 @@ type Table struct {

type ExtraTableInfo struct {
PkOrdinals []int
Replicated bool
}

type ColumnInfo struct {
Expand Down Expand Up @@ -362,7 +362,7 @@ func (t *Table) CreateIndex(ctx *sql.Context, indexDef sql.IndexDef) error {
defer t.mu.Unlock()

// https://github.com/apecloud/myduckserver/issues/272
if mycontext.IsReplicationQuery(ctx) && configuration.IsReplicationWithoutIndex() {
if isIndexCreationDisabled(ctx) {
return nil
}

Expand Down
2 changes: 1 addition & 1 deletion configuration/env.go
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ const (

func IsReplicationWithoutIndex() bool {
switch strings.ToLower(os.Getenv(replicationWithoutIndex)) {
case "", "t", "1", "true":
case "", "y", "t", "1", "on", "yes", "true":
return true
}
return false
Expand Down
1 change: 1 addition & 0 deletions devtools/replica-setup-mysql/prepare.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,4 +17,5 @@ echo "Setting local_infile and server_id..."
mysqlsh --sql --host=${MYDUCK_HOST} --port=${MYDUCK_PORT} --user=root --no-password <<EOF
SET GLOBAL local_infile = 1;
SET GLOBAL server_id = ${MYDUCK_SERVER_ID};
SET GLOBAL replica_is_loading_snapshot = ON;
EOF
19 changes: 17 additions & 2 deletions devtools/replica-setup-mysql/snapshot.sh
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,17 @@ echo "Thread count set to: $THREAD_COUNT"

echo "Copying data from MySQL to MyDuck..."
# Run mysqlsh command and capture the output
output=$(mysqlsh --uri "$SOURCE_DSN" $SOURCE_NO_PASSWORD_OPTION -- util copy-instance "mysql://${MYDUCK_USER}:${MYDUCK_PASSWORD}@${MYDUCK_HOST}:${MYDUCK_PORT}" --users false --consistent false --ignore-existing-objects true --handle-grant-errors ignore --threads $THREAD_COUNT --bytesPerChunk 256M --ignore-version true)
output=$(mysqlsh --uri "$SOURCE_DSN" $SOURCE_NO_PASSWORD_OPTION -- util copy-instance "mysql://${MYDUCK_USER}:${MYDUCK_PASSWORD}@${MYDUCK_HOST}:${MYDUCK_PORT}" \
--users false \
--consistent false \
--ignore-existing-objects true \
--handle-grant-errors ignore \
--threads $THREAD_COUNT \
--bytesPerChunk 256M \
--ignore-version true \
--load-indexes false \
--defer-table-indexes all \
)

if [[ $GTID_MODE == "ON" ]]; then
# Extract the EXECUTED_GTID_SET from this output:
Expand Down Expand Up @@ -71,4 +81,9 @@ else
fi


echo "Snapshot completed successfully."
echo "Snapshot completed successfully."

echo "Reset replica_is_loading_snapshot..."
mysqlsh --sql --host=${MYDUCK_HOST} --port=${MYDUCK_PORT} --user=root --no-password <<EOF
SET GLOBAL replica_is_loading_snapshot = OFF;
EOF
9 changes: 9 additions & 0 deletions replica/options.go
Original file line number Diff line number Diff line change
Expand Up @@ -48,5 +48,14 @@ func RegisterReplicaOptions(options *ReplicaOptions) {
Type: types.NewSystemStringType("report_password"),
Default: options.ReportPassword,
},
// MyDuck-specific system variables
&sql.MysqlSystemVariable{
Name: "replica_is_loading_snapshot",
Scope: sql.GetMysqlScope(sql.SystemVariableScope_Global),
Dynamic: true,
SetVarHintApplies: false,
Type: types.NewSystemBoolType("replica_is_loading_snapshot"),
Default: false,
},
})
}

0 comments on commit 0d691f2

Please sign in to comment.