From 741048197401416c290c70b18efe6bf1be838133 Mon Sep 17 00:00:00 2001 From: Luis Carvalho Date: Fri, 30 Aug 2024 08:15:42 +0100 Subject: [PATCH] fix: prevent stuck SLCs waiting for valset (#1274) # Related Github tickets - Closes https://github.com/VolumeFi/paloma/issues/1040 # Background If a JIT ValsetUpdate fails, it can lead to SLC messages being stuck. In order to overcome this, we set a watcher on the end blocker to insert new ValsetUpdates when needed if there is an SLC message in the queue (or UploadUserSmartContract message). # Testing completed - [x] test coverage exists or has been added/updated - [x] tested in a private testnet # Breaking changes - [x] I have checked my code for breaking changes - [x] If there are breaking changes, there is a supporting migration. --- x/evm/keeper/keeper.go | 52 ++++++++ x/evm/keeper/keeper_test.go | 254 ++++++++++++++++++++++++++++++++++++ x/evm/module.go | 4 + 3 files changed, 310 insertions(+) diff --git a/x/evm/keeper/keeper.go b/x/evm/keeper/keeper.go index bee1b4553..a1ac6efaa 100644 --- a/x/evm/keeper/keeper.go +++ b/x/evm/keeper/keeper.go @@ -928,3 +928,55 @@ func (k Keeper) GetValidatorAddressByEthAddress(ctx context.Context, ethAddr sky } return } + +func (k Keeper) AddJustInTimeValsetUpdates(ctx context.Context) { + chainInfos, err := k.GetAllChainInfos(ctx) + if err != nil { + k.Logger(ctx).Error("failed to get chains infos", "err", err) + return + } + + for _, chainInfo := range chainInfos { + queueName := consensustypes.Queue( + types.ConsensusTurnstoneMessage, + xchainType, + xchain.ReferenceID(chainInfo.GetChainReferenceID()), + ) + + messages, err := k.ConsensusKeeper.GetMessagesFromQueue(ctx, queueName, 0) + if err != nil { + k.Logger(ctx).Error("failed to get messages from queue", "err", err) + return + } + + var hasUpdateValset, hasFeePayer bool + + for _, msg := range messages { + consMsg, err := msg.ConsensusMsg(k.cdc) + if err != nil { + continue + } + + mmsg, ok := consMsg.(*types.Message) + if !ok { + continue + } + + switch mmsg.Action.(type) { + case *types.Message_UpdateValset: + hasUpdateValset = true + case types.FeePayer: + hasFeePayer = true + } + } + + if hasFeePayer && !hasUpdateValset { + // Check if we need the valset update and add it to the queue + err = k.justInTimeValsetUpdate(ctx, chainInfo) + if err != nil { + k.Logger(ctx).Error("failed to issue valset update", "err", err) + return + } + } + } +} diff --git a/x/evm/keeper/keeper_test.go b/x/evm/keeper/keeper_test.go index a23fc2165..dd298c5e9 100644 --- a/x/evm/keeper/keeper_test.go +++ b/x/evm/keeper/keeper_test.go @@ -7,10 +7,12 @@ import ( "testing" "time" + "cosmossdk.io/math" sdkmath "cosmossdk.io/math" codectypes "github.com/cosmos/cosmos-sdk/codec/types" sdk "github.com/cosmos/cosmos-sdk/types" "github.com/ethereum/go-ethereum/common" + "github.com/palomachain/paloma/util/slice" consensustypes "github.com/palomachain/paloma/x/consensus/types" "github.com/palomachain/paloma/x/evm/types" evmtypes "github.com/palomachain/paloma/x/evm/types" @@ -711,3 +713,255 @@ func TestKeeper_SendValsetMsgForChain(t *testing.T) { assert.NoError(t, err) }) } + +func TestKeeper_AddJustInTimeValsetUpdates(t *testing.T) { + chainInfo := &types.ChainInfo{ + ChainID: 100, + ChainReferenceID: "test-chain", + ReferenceBlockHeight: 1000, + ReferenceBlockHash: "0x00", + MinOnChainBalance: "100", + SmartContractUniqueID: []byte("abc"), + SmartContractAddr: "0x01", + RelayWeights: &types.RelayWeights{ + Fee: "1.0", + Uptime: "1.0", + SuccessRate: "1.0", + ExecutionTime: "1.0", + FeatureSet: "1.0", + }, + } + + type valpower struct { + valAddr sdk.ValAddress + power int64 + externalChain []*valsettypes.ExternalChainInfo + } + + var totalPower int64 = 20 + valpowers := []valpower{ + { + valAddr: sdk.ValAddress("validator-1"), + power: 15, + externalChain: []*valsettypes.ExternalChainInfo{ + { + ChainType: "evm", + ChainReferenceID: chainInfo.GetChainReferenceID(), + Address: "addr1", + Pubkey: []byte("1"), + }, + }, + }, + { + valAddr: sdk.ValAddress("validator-2"), + power: 5, + externalChain: []*valsettypes.ExternalChainInfo{ + { + ChainType: "evm", + ChainReferenceID: chainInfo.GetChainReferenceID(), + Address: "addr1", + Pubkey: []byte("1"), + }, + }, + }, + } + + currentSnapshot := &valsettypes.Snapshot{ + Id: 5, + Validators: slice.Map(valpowers, func(p valpower) valsettypes.Validator { + return valsettypes.Validator{ + ShareCount: sdkmath.NewInt(p.power), + Address: p.valAddr, + ExternalChainInfos: p.externalChain, + } + }), + TotalShares: sdkmath.NewInt(totalPower), + } + + validatorMetrics := &metrixtypes.QueryValidatorsResponse{ + ValMetrics: []metrixtypes.ValidatorMetrics{ + { + ValAddress: sdk.ValAddress("validator-1").String(), + Uptime: sdkmath.LegacyOneDec(), + SuccessRate: sdkmath.LegacyOneDec(), + ExecutionTime: sdkmath.NewInt(0), + Fee: sdkmath.NewInt(0), + FeatureSet: sdkmath.LegacyOneDec(), + }, + }, + } + + fee, _ := sdkmath.LegacyNewDecFromStr("1.1") + relayerFees := map[string]math.LegacyDec{ + sdk.ValAddress("validator-1").String(): fee, + } + + t.Run("Should add valset update with SLC", func(t *testing.T) { + k, ms, ctx := NewEvmKeeper(t) + err := k.updateChainInfo(ctx, chainInfo) + require.NoError(t, err) + + qMsg, _ := codectypes.NewAnyWithValue(&evmtypes.Message{ + TurnstoneID: "abc", + ChainReferenceID: "test-chain", + Assignee: "addr4", + Action: &evmtypes.Message_SubmitLogicCall{ + SubmitLogicCall: &evmtypes.SubmitLogicCall{ + SenderAddress: sdk.ValAddress("sender"), + }, + }, + }) + + msgs := []consensustypes.QueuedSignedMessageI{ + &consensustypes.QueuedSignedMessage{ + Id: 1, + Msg: qMsg, + }, + } + + ms.ConsensusKeeper.On("GetMessagesFromQueue", mock.Anything, + mock.Anything, mock.Anything). + Return(msgs, nil). + Once() + + ms.ValsetKeeper.On("GetCurrentSnapshot", mock.Anything). + Return(currentSnapshot, nil) + + ms.ValsetKeeper.On("GetLatestSnapshotOnChain", mock.Anything, mock.Anything). + Return(&valsettypes.Snapshot{Id: 1}, nil) + + ms.MetrixKeeper.On("Validators", mock.Anything, mock.Anything). + Return(validatorMetrics, nil) + + ms.TreasuryKeeper.On("GetRelayerFeesByChainReferenceID", mock.Anything, + chainInfo.ChainReferenceID). + Return(relayerFees, nil) + + ms.MsgSender.On("SendValsetMsgForChain", mock.Anything, mock.Anything, + mock.Anything, mock.Anything, mock.Anything). + Return(nil) + + k.AddJustInTimeValsetUpdates(ctx) + }) + + t.Run("Should do nothing if no SLC in queue", func(t *testing.T) { + k, ms, ctx := NewEvmKeeper(t) + err := k.updateChainInfo(ctx, chainInfo) + require.NoError(t, err) + + qMsg, _ := codectypes.NewAnyWithValue(&evmtypes.Message{ + TurnstoneID: "abc", + ChainReferenceID: "test-chain", + Assignee: "addr4", + Action: &evmtypes.Message_UploadSmartContract{ + UploadSmartContract: &evmtypes.UploadSmartContract{}, + }, + }) + + msgs := []consensustypes.QueuedSignedMessageI{ + &consensustypes.QueuedSignedMessage{ + Id: 1, + Msg: qMsg, + }, + } + + ms.ConsensusKeeper.On("GetMessagesFromQueue", mock.Anything, mock.Anything, mock.Anything). + Return(msgs, nil). + Once() + + k.AddJustInTimeValsetUpdates(ctx) + }) + + t.Run("Should do nothing if valset update is already scheduled", func(t *testing.T) { + k, ms, ctx := NewEvmKeeper(t) + err := k.updateChainInfo(ctx, chainInfo) + require.NoError(t, err) + + qMsg, _ := codectypes.NewAnyWithValue(&evmtypes.Message{ + TurnstoneID: "abc", + ChainReferenceID: "test-chain", + Assignee: "addr4", + Action: &evmtypes.Message_UpdateValset{ + UpdateValset: &evmtypes.UpdateValset{ + Valset: &evmtypes.Valset{ + ValsetID: 2, + }, + }, + }, + }) + + slcMsg, _ := codectypes.NewAnyWithValue(&evmtypes.Message{ + TurnstoneID: "abc", + ChainReferenceID: "test-chain", + Assignee: "addr4", + Action: &evmtypes.Message_SubmitLogicCall{ + SubmitLogicCall: &evmtypes.SubmitLogicCall{ + SenderAddress: sdk.ValAddress("sender"), + }, + }, + }) + + msgs := []consensustypes.QueuedSignedMessageI{ + &consensustypes.QueuedSignedMessage{ + Id: 1, + Msg: qMsg, + }, + &consensustypes.QueuedSignedMessage{ + Id: 2, + Msg: slcMsg, + }, + } + + ms.ConsensusKeeper.On("GetMessagesFromQueue", mock.Anything, mock.Anything, mock.Anything). + Return(msgs, nil). + Once() + + k.AddJustInTimeValsetUpdates(ctx) + }) + + t.Run("Should add valset update with UploadUserSmartContract", func(t *testing.T) { + k, ms, ctx := NewEvmKeeper(t) + err := k.updateChainInfo(ctx, chainInfo) + require.NoError(t, err) + + qMsg, _ := codectypes.NewAnyWithValue(&evmtypes.Message{ + TurnstoneID: "abc", + ChainReferenceID: "test-chain", + Assignee: "addr4", + Action: &evmtypes.Message_UploadUserSmartContract{ + UploadUserSmartContract: &evmtypes.UploadUserSmartContract{}, + }, + }) + + msgs := []consensustypes.QueuedSignedMessageI{ + &consensustypes.QueuedSignedMessage{ + Id: 1, + Msg: qMsg, + }, + } + + ms.ConsensusKeeper.On("GetMessagesFromQueue", mock.Anything, + mock.Anything, mock.Anything). + Return(msgs, nil). + Once() + + ms.ValsetKeeper.On("GetCurrentSnapshot", mock.Anything). + Return(currentSnapshot, nil) + + ms.ValsetKeeper.On("GetLatestSnapshotOnChain", mock.Anything, mock.Anything). + Return(&valsettypes.Snapshot{Id: 1}, nil) + + ms.MetrixKeeper.On("Validators", mock.Anything, mock.Anything). + Return(validatorMetrics, nil) + + ms.TreasuryKeeper.On("GetRelayerFeesByChainReferenceID", mock.Anything, + chainInfo.ChainReferenceID). + Return(relayerFees, nil) + + ms.MsgSender.On("SendValsetMsgForChain", mock.Anything, mock.Anything, + mock.Anything, mock.Anything, mock.Anything). + Return(nil) + + k.AddJustInTimeValsetUpdates(ctx) + }) +} diff --git a/x/evm/module.go b/x/evm/module.go index 8fe5c20e4..50254d4c1 100644 --- a/x/evm/module.go +++ b/x/evm/module.go @@ -183,6 +183,10 @@ func (am AppModule) EndBlock(ctx context.Context) error { sdkCtx := sdk.UnwrapSDKContext(ctx) am.keeper.TryDeployingLastCompassContractToAllChains(sdkCtx) + // Add valset updates to queue if we have SLCs in the queue and a valset + // mismatch. This should prevent SLCs from getting stuck. + am.keeper.AddJustInTimeValsetUpdates(sdkCtx) + if sdkCtx.BlockHeight()%300 == 0 { if err := am.scheduleExternalBalances(sdkCtx); err != nil { liblog.FromSDKLogger(sdkCtx.Logger()).WithError(err).