From 0008f867438d7a0d501d0f08f140a0c1aa0361a7 Mon Sep 17 00:00:00 2001 From: "mergify[bot]" <37929162+mergify[bot]@users.noreply.github.com> Date: Wed, 21 Dec 2022 17:56:06 -0500 Subject: [PATCH] cli: add --hard flag to rollback command to remove block as well (backport #9261) (#9465) * cli: add --hard flag to rollback command to remove block as well (#9261) Co-authored-by: Levi Aul (cherry picked from commit e84d43ec93a3456d1b3c9df39513c9c77409ab02) * Fix lint Signed-off-by: Thane Thomson Signed-off-by: Thane Thomson Co-authored-by: Callum Waters Co-authored-by: Thane Thomson --- cmd/cometbft/commands/rollback.go | 26 ++++-- consensus/replay_test.go | 2 + state/mocks/block_store.go | 14 ++++ state/rollback.go | 19 ++++- state/rollback_test.go | 127 +++++++++++++++++++++++++++++- state/services.go | 2 + store/store.go | 47 +++++++++++ store/store_test.go | 3 + 8 files changed, 226 insertions(+), 14 deletions(-) diff --git a/cmd/cometbft/commands/rollback.go b/cmd/cometbft/commands/rollback.go index 027813ef93..b5dd1ded25 100644 --- a/cmd/cometbft/commands/rollback.go +++ b/cmd/cometbft/commands/rollback.go @@ -14,6 +14,12 @@ import ( "github.com/cometbft/cometbft/store" ) +var removeBlock = false + +func init() { + RollbackStateCmd.Flags().BoolVar(&removeBlock, "hard", false, "remove last block as well as state") +} + var RollbackStateCmd = &cobra.Command{ Use: "rollback", Short: "rollback CometBFT state by one height", @@ -21,17 +27,23 @@ var RollbackStateCmd = &cobra.Command{ A state rollback is performed to recover from an incorrect application state transition, when CometBFT has persisted an incorrect app hash and is thus unable to make progress. Rollback overwrites a state at height n with the state at height n - 1. -The application should also roll back to height n - 1. No blocks are removed, so upon -restarting CometBFT the transactions in block n will be re-executed against the -application. +The application should also roll back to height n - 1. If the --hard flag is not used, +no blocks will be removed so upon restarting Tendermint the transactions in block n will be +re-executed against the application. Using --hard will also remove block n. This can +be done multiple times. `, RunE: func(cmd *cobra.Command, args []string) error { - height, hash, err := RollbackState(config) + height, hash, err := RollbackState(config, removeBlock) if err != nil { return fmt.Errorf("failed to rollback state: %w", err) } - fmt.Printf("Rolled back state to height %d and hash %v", height, hash) + if removeBlock { + fmt.Printf("Rolled back both state and block to height %d and hash %X\n", height, hash) + } else { + fmt.Printf("Rolled back state to height %d and hash %X\n", height, hash) + } + return nil }, } @@ -39,7 +51,7 @@ application. // RollbackState takes the state at the current height n and overwrites it with the state // at height n - 1. Note state here refers to CometBFT state not application state. // Returns the latest state height and app hash alongside an error if there was one. -func RollbackState(config *cfg.Config) (int64, []byte, error) { +func RollbackState(config *cfg.Config, removeBlock bool) (int64, []byte, error) { // use the parsed config to load the block and state store blockStore, stateStore, err := loadStateAndBlockStore(config) if err != nil { @@ -51,7 +63,7 @@ func RollbackState(config *cfg.Config) (int64, []byte, error) { }() // rollback the last state - return state.Rollback(blockStore, stateStore) + return state.Rollback(blockStore, stateStore, removeBlock) } func loadStateAndBlockStore(config *cfg.Config) (*store.BlockStore, state.Store, error) { diff --git a/consensus/replay_test.go b/consensus/replay_test.go index 5b81da02f9..c80a7d9369 100644 --- a/consensus/replay_test.go +++ b/consensus/replay_test.go @@ -1241,6 +1241,8 @@ func (bs *mockBlockStore) PruneBlocks(height int64) (uint64, error) { return pruned, nil } +func (bs *mockBlockStore) DeleteLatestBlock() error { return nil } + //--------------------------------------- // Test handshake/init chain diff --git a/state/mocks/block_store.go b/state/mocks/block_store.go index 792dbe2106..e38de9c88b 100644 --- a/state/mocks/block_store.go +++ b/state/mocks/block_store.go @@ -27,6 +27,20 @@ func (_m *BlockStore) Base() int64 { return r0 } +// DeleteLatestBlock provides a mock function with given fields: +func (_m *BlockStore) DeleteLatestBlock() error { + ret := _m.Called() + + var r0 error + if rf, ok := ret.Get(0).(func() error); ok { + r0 = rf() + } else { + r0 = ret.Error(0) + } + + return r0 +} + // Height provides a mock function with given fields: func (_m *BlockStore) Height() int64 { ret := _m.Called() diff --git a/state/rollback.go b/state/rollback.go index 69d1965d95..6420192cf7 100644 --- a/state/rollback.go +++ b/state/rollback.go @@ -12,7 +12,7 @@ import ( // Rollback overwrites the current CometBFT state (height n) with the most // recent previous state (height n - 1). // Note that this function does not affect application state. -func Rollback(bs BlockStore, ss Store) (int64, []byte, error) { +func Rollback(bs BlockStore, ss Store, removeBlock bool) (int64, []byte, error) { invalidState, err := ss.Load() if err != nil { return -1, nil, err @@ -24,9 +24,14 @@ func Rollback(bs BlockStore, ss Store) (int64, []byte, error) { height := bs.Height() // NOTE: persistence of state and blocks don't happen atomically. Therefore it is possible that - // when the user stopped the node the state wasn't updated but the blockstore was. In this situation - // we don't need to rollback any state and can just return early + // when the user stopped the node the state wasn't updated but the blockstore was. Discard the + // pending block before continuing. if height == invalidState.LastBlockHeight+1 { + if removeBlock { + if err := bs.DeleteLatestBlock(); err != nil { + return -1, nil, fmt.Errorf("failed to remove final block from blockstore: %w", err) + } + } return invalidState.LastBlockHeight, invalidState.AppHash, nil } @@ -108,5 +113,13 @@ func Rollback(bs BlockStore, ss Store) (int64, []byte, error) { return -1, nil, fmt.Errorf("failed to save rolled back state: %w", err) } + // If removeBlock is true then also remove the block associated with the previous state. + // This will mean both the last state and last block height is equal to n - 1 + if removeBlock { + if err := bs.DeleteLatestBlock(); err != nil { + return -1, nil, fmt.Errorf("failed to remove final block from blockstore: %w", err) + } + } + return rolledBackState.LastBlockHeight, rolledBackState.AppHash, nil } diff --git a/state/rollback_test.go b/state/rollback_test.go index d4403fc7f6..2e120494a6 100644 --- a/state/rollback_test.go +++ b/state/rollback_test.go @@ -3,6 +3,7 @@ package state_test import ( "crypto/rand" "testing" + "time" dbm "github.com/cometbft/cometbft-db" "github.com/stretchr/testify/require" @@ -13,6 +14,7 @@ import ( cmtversion "github.com/cometbft/cometbft/proto/tendermint/version" "github.com/cometbft/cometbft/state" "github.com/cometbft/cometbft/state/mocks" + "github.com/cometbft/cometbft/store" "github.com/cometbft/cometbft/types" "github.com/cometbft/cometbft/version" ) @@ -50,6 +52,7 @@ func TestRollback(t *testing.T) { BlockID: initialState.LastBlockID, Header: types.Header{ Height: initialState.LastBlockHeight, + Time: initialState.LastBlockTime, AppHash: crypto.CRandBytes(tmhash.Size), LastBlockID: makeBlockIDRandom(), LastResultsHash: initialState.LastResultsHash, @@ -61,6 +64,7 @@ func TestRollback(t *testing.T) { Height: nextState.LastBlockHeight, AppHash: initialState.AppHash, LastBlockID: block.BlockID, + Time: nextState.LastBlockTime, LastResultsHash: nextState.LastResultsHash, }, } @@ -69,7 +73,7 @@ func TestRollback(t *testing.T) { blockStore.On("Height").Return(nextHeight) // rollback the state - rollbackHeight, rollbackHash, err := state.Rollback(blockStore, stateStore) + rollbackHeight, rollbackHash, err := state.Rollback(blockStore, stateStore, false) require.NoError(t, err) require.EqualValues(t, height, rollbackHeight) require.EqualValues(t, initialState.AppHash, rollbackHash) @@ -81,6 +85,120 @@ func TestRollback(t *testing.T) { require.EqualValues(t, initialState, loadedState) } +func TestRollbackHard(t *testing.T) { + const height int64 = 100 + blockStore := store.NewBlockStore(dbm.NewMemDB()) + stateStore := state.NewStore(dbm.NewMemDB(), state.StoreOptions{DiscardABCIResponses: false}) + + valSet, _ := types.RandValidatorSet(5, 10) + + params := types.DefaultConsensusParams() + params.Version.App = 10 + now := time.Date(2020, 1, 1, 0, 0, 0, 0, time.UTC) + + block := &types.Block{ + Header: types.Header{ + Version: cmtversion.Consensus{Block: version.BlockProtocol, App: 1}, + ChainID: "test-chain", + Time: now, + Height: height, + AppHash: crypto.CRandBytes(tmhash.Size), + LastBlockID: makeBlockIDRandom(), + LastCommitHash: crypto.CRandBytes(tmhash.Size), + DataHash: crypto.CRandBytes(tmhash.Size), + ValidatorsHash: valSet.Hash(), + NextValidatorsHash: valSet.CopyIncrementProposerPriority(1).Hash(), + ConsensusHash: params.Hash(), + LastResultsHash: crypto.CRandBytes(tmhash.Size), + EvidenceHash: crypto.CRandBytes(tmhash.Size), + ProposerAddress: crypto.CRandBytes(crypto.AddressSize), + }, + LastCommit: &types.Commit{Height: height - 1}, + } + + partSet := block.MakePartSet(types.BlockPartSizeBytes) + blockStore.SaveBlock(block, partSet, &types.Commit{Height: block.Height}) + + currState := state.State{ + Version: cmtstate.Version{ + Consensus: block.Header.Version, + Software: version.TMCoreSemVer, + }, + LastBlockHeight: block.Height, + LastBlockTime: block.Time, + AppHash: crypto.CRandBytes(tmhash.Size), + LastValidators: valSet, + Validators: valSet.CopyIncrementProposerPriority(1), + NextValidators: valSet.CopyIncrementProposerPriority(2), + ConsensusParams: *params, + LastHeightConsensusParamsChanged: height + 1, + LastHeightValidatorsChanged: height + 1, + LastResultsHash: crypto.CRandBytes(tmhash.Size), + } + require.NoError(t, stateStore.Bootstrap(currState)) + + nextBlock := &types.Block{ + Header: types.Header{ + Version: cmtversion.Consensus{Block: version.BlockProtocol, App: 1}, + ChainID: block.ChainID, + Time: block.Time, + Height: currState.LastBlockHeight + 1, + AppHash: currState.AppHash, + LastBlockID: types.BlockID{Hash: block.Hash(), PartSetHeader: partSet.Header()}, + LastCommitHash: crypto.CRandBytes(tmhash.Size), + DataHash: crypto.CRandBytes(tmhash.Size), + ValidatorsHash: valSet.CopyIncrementProposerPriority(1).Hash(), + NextValidatorsHash: valSet.CopyIncrementProposerPriority(2).Hash(), + ConsensusHash: params.Hash(), + LastResultsHash: currState.LastResultsHash, + EvidenceHash: crypto.CRandBytes(tmhash.Size), + ProposerAddress: crypto.CRandBytes(crypto.AddressSize), + }, + LastCommit: &types.Commit{Height: currState.LastBlockHeight}, + } + + nextPartSet := nextBlock.MakePartSet(types.BlockPartSizeBytes) + blockStore.SaveBlock(nextBlock, nextPartSet, &types.Commit{Height: nextBlock.Height}) + + rollbackHeight, rollbackHash, err := state.Rollback(blockStore, stateStore, true) + require.NoError(t, err) + require.Equal(t, rollbackHeight, currState.LastBlockHeight) + require.Equal(t, rollbackHash, currState.AppHash) + + // state should not have been changed + loadedState, err := stateStore.Load() + require.NoError(t, err) + require.Equal(t, currState, loadedState) + + // resave the same block + blockStore.SaveBlock(nextBlock, nextPartSet, &types.Commit{Height: nextBlock.Height}) + + params.Version.App = 11 + + nextState := state.State{ + Version: cmtstate.Version{ + Consensus: block.Header.Version, + Software: version.TMCoreSemVer, + }, + LastBlockHeight: nextBlock.Height, + LastBlockTime: nextBlock.Time, + AppHash: crypto.CRandBytes(tmhash.Size), + LastValidators: valSet.CopyIncrementProposerPriority(1), + Validators: valSet.CopyIncrementProposerPriority(2), + NextValidators: valSet.CopyIncrementProposerPriority(3), + ConsensusParams: *params, + LastHeightConsensusParamsChanged: nextBlock.Height + 1, + LastHeightValidatorsChanged: nextBlock.Height + 1, + LastResultsHash: crypto.CRandBytes(tmhash.Size), + } + require.NoError(t, stateStore.Save(nextState)) + + rollbackHeight, rollbackHash, err = state.Rollback(blockStore, stateStore, true) + require.NoError(t, err) + require.Equal(t, rollbackHeight, currState.LastBlockHeight) + require.Equal(t, rollbackHash, currState.AppHash) +} + func TestRollbackNoState(t *testing.T) { stateStore := state.NewStore(dbm.NewMemDB(), state.StoreOptions{ @@ -88,7 +206,7 @@ func TestRollbackNoState(t *testing.T) { }) blockStore := &mocks.BlockStore{} - _, _, err := state.Rollback(blockStore, stateStore) + _, _, err := state.Rollback(blockStore, stateStore, false) require.Error(t, err) require.Contains(t, err.Error(), "no state found") } @@ -101,7 +219,7 @@ func TestRollbackNoBlocks(t *testing.T) { blockStore.On("LoadBlockMeta", height).Return(nil) blockStore.On("LoadBlockMeta", height-1).Return(nil) - _, _, err := state.Rollback(blockStore, stateStore) + _, _, err := state.Rollback(blockStore, stateStore, false) require.Error(t, err) require.Contains(t, err.Error(), "block at height 99 not found") } @@ -112,7 +230,7 @@ func TestRollbackDifferentStateHeight(t *testing.T) { blockStore := &mocks.BlockStore{} blockStore.On("Height").Return(height + 2) - _, _, err := state.Rollback(blockStore, stateStore) + _, _, err := state.Rollback(blockStore, stateStore, false) require.Error(t, err) require.Equal(t, err.Error(), "statestore height (100) is not one below or equal to blockstore height (102)") } @@ -138,6 +256,7 @@ func setupStateStore(t *testing.T, height int64) state.Store { AppHash: tmhash.Sum([]byte("app_hash")), LastResultsHash: tmhash.Sum([]byte("last_results_hash")), LastBlockHeight: height, + LastBlockTime: time.Now(), LastValidators: valSet, Validators: valSet.CopyIncrementProposerPriority(1), NextValidators: valSet.CopyIncrementProposerPriority(2), diff --git a/state/services.go b/state/services.go index bb6606bcac..b3e4e28bd4 100644 --- a/state/services.go +++ b/state/services.go @@ -34,6 +34,8 @@ type BlockStore interface { LoadBlockCommit(height int64) *types.Commit LoadSeenCommit(height int64) *types.Commit + + DeleteLatestBlock() error } //----------------------------------------------------------------------------- diff --git a/store/store.go b/store/store.go index 5b946d9f37..72655359ec 100644 --- a/store/store.go +++ b/store/store.go @@ -521,3 +521,50 @@ func mustEncode(pb proto.Message) []byte { } return bz } + +//----------------------------------------------------------------------------- + +// DeleteLatestBlock removes the block pointed to by height, +// lowering height by one. +func (bs *BlockStore) DeleteLatestBlock() error { + bs.mtx.RLock() + targetHeight := bs.height + bs.mtx.RUnlock() + + batch := bs.db.NewBatch() + defer batch.Close() + + // delete what we can, skipping what's already missing, to ensure partial + // blocks get deleted fully. + if meta := bs.LoadBlockMeta(targetHeight); meta != nil { + if err := batch.Delete(calcBlockHashKey(meta.BlockID.Hash)); err != nil { + return err + } + for p := 0; p < int(meta.BlockID.PartSetHeader.Total); p++ { + if err := batch.Delete(calcBlockPartKey(targetHeight, p)); err != nil { + return err + } + } + } + if err := batch.Delete(calcBlockCommitKey(targetHeight)); err != nil { + return err + } + if err := batch.Delete(calcSeenCommitKey(targetHeight)); err != nil { + return err + } + // delete last, so as to not leave keys built on meta.BlockID dangling + if err := batch.Delete(calcBlockMetaKey(targetHeight)); err != nil { + return err + } + + bs.mtx.Lock() + bs.height = targetHeight - 1 + bs.mtx.Unlock() + bs.saveState() + + err := batch.WriteSync() + if err != nil { + return fmt.Errorf("failed to delete height %v: %w", targetHeight, err) + } + return nil +} diff --git a/store/store_test.go b/store/store_test.go index e8250f2f2c..f962fa0cf1 100644 --- a/store/store_test.go +++ b/store/store_test.go @@ -398,6 +398,9 @@ func TestLoadBaseMeta(t *testing.T) { baseBlock := bs.LoadBaseMeta() assert.EqualValues(t, 4, baseBlock.Header.Height) assert.EqualValues(t, 4, bs.Base()) + + require.NoError(t, bs.DeleteLatestBlock()) + require.EqualValues(t, 9, bs.Height()) } func TestLoadBlockPart(t *testing.T) {