From ddab705b092525af085288af618e0cee6733a61e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Facundo=20Dom=C3=ADnguez?= Date: Tue, 20 Aug 2024 21:00:13 +0000 Subject: [PATCH] Update configuration after recovering BulkSync in ouroboros-network --- .../Ouroboros/Consensus/Node.hs | 6 +- .../Ouroboros/Consensus/Node/Genesis.hs | 48 +++++++-------- .../Ouroboros/Consensus/NodeKernel.hs | 8 +++ .../Test/ThreadNet/Network.hs | 7 ++- .../Consensus/PeerSimulator/BlockFetch.hs | 21 ++++--- .../BlockFetch/ClientInterface.hs | 59 ++++++++++--------- .../MiniProtocol/BlockFetch/Client.hs | 20 +++++-- 7 files changed, 99 insertions(+), 70 deletions(-) diff --git a/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node.hs b/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node.hs index f434c0f432..dd391f519d 100644 --- a/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node.hs +++ b/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node.hs @@ -321,7 +321,8 @@ nonImmutableDbPath (MultipleDbPaths _ vol) = vol -- -- See 'stdLowLevelRunNodeArgsIO'. data StdRunNodeArgs m blk (p2p :: Diffusion.P2P) = StdRunNodeArgs - { srnBfcMaxConcurrencyDeadline :: Maybe Word + { srnBfcMaxConcurrencyBulkSync :: Maybe Word + , srnBfcMaxConcurrencyDeadline :: Maybe Word , srnChainDbValidateOverride :: Bool -- ^ If @True@, validate the ChainDB on init no matter what , srnDiskPolicyArgs :: DiskPolicyArgs @@ -985,6 +986,9 @@ stdLowLevelRunNodeArgsIO RunNodeArgs{ rnProtocolInfo maybe id (\mc bfc -> bfc { bfcMaxConcurrencyDeadline = mc }) srnBfcMaxConcurrencyDeadline + . maybe id + (\mc bfc -> bfc { bfcMaxConcurrencyBulkSync = mc }) + srnBfcMaxConcurrencyBulkSync modifyMempoolCapacityOverride = maybe id (\mc nka -> nka { mempoolCapacityOverride = mc }) diff --git a/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node/Genesis.hs b/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node/Genesis.hs index 84a90e90fd..ba08a02408 100644 --- a/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node/Genesis.hs +++ b/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/Node/Genesis.hs @@ -66,26 +66,26 @@ data GenesisConfig = GenesisConfig -- | Genesis configuration flags and low-level args, as parsed from config file or CLI data GenesisConfigFlags = GenesisConfigFlags - { gcfEnableCSJ :: Bool - , gcfEnableLoEAndGDD :: Bool - , gcfEnableLoP :: Bool - , gcfBulkSyncGracePeriod :: Maybe Integer - , gcfBucketCapacity :: Maybe Integer - , gcfBucketRate :: Maybe Integer - , gcfCSJJumpSize :: Maybe Integer - , gcfGDDRateLimit :: Maybe DiffTime + { gcfEnableCSJ :: Bool + , gcfEnableLoEAndGDD :: Bool + , gcfEnableLoP :: Bool + , gcfBlockFetchGracePeriod :: Maybe Integer + , gcfBucketCapacity :: Maybe Integer + , gcfBucketRate :: Maybe Integer + , gcfCSJJumpSize :: Maybe Integer + , gcfGDDRateLimit :: Maybe DiffTime } deriving stock (Eq, Generic, Show) defaultGenesisConfigFlags :: GenesisConfigFlags defaultGenesisConfigFlags = GenesisConfigFlags - { gcfEnableCSJ = True - , gcfEnableLoEAndGDD = True - , gcfEnableLoP = True - , gcfBulkSyncGracePeriod = Nothing - , gcfBucketCapacity = Nothing - , gcfBucketRate = Nothing - , gcfCSJJumpSize = Nothing - , gcfGDDRateLimit = Nothing + { gcfEnableCSJ = True + , gcfEnableLoEAndGDD = True + , gcfEnableLoP = True + , gcfBlockFetchGracePeriod = Nothing + , gcfBucketCapacity = Nothing + , gcfBucketRate = Nothing + , gcfCSJJumpSize = Nothing + , gcfGDDRateLimit = Nothing } enableGenesisConfigDefault :: GenesisConfig @@ -99,7 +99,7 @@ mkGenesisConfig :: Maybe GenesisConfigFlags -> GenesisConfig mkGenesisConfig Nothing = -- disable Genesis GenesisConfig { gcBlockFetchConfig = GenesisBlockFetchConfiguration - { gbfcBulkSyncGracePeriod = 0 -- no grace period when Genesis is disabled + { gbfcGracePeriod = 0 -- no grace period when Genesis is disabled } , gcChainSyncLoPBucketConfig = ChainSyncLoPBucketDisabled , gcCSJConfig = CSJDisabled @@ -109,7 +109,7 @@ mkGenesisConfig Nothing = -- disable Genesis mkGenesisConfig (Just GenesisConfigFlags{..}) = GenesisConfig { gcBlockFetchConfig = GenesisBlockFetchConfiguration - { gbfcBulkSyncGracePeriod + { gbfcGracePeriod } , gcChainSyncLoPBucketConfig = if gcfEnableLoP then ChainSyncLoPBucketEnabled ChainSyncLoPBucketEnabledConfig @@ -134,7 +134,7 @@ mkGenesisConfig (Just GenesisConfigFlags{..}) = -- The minimum amount of time during which the Genesis BlockFetch logic will -- download blocks from a specific peer (even if it is not performing well -- during that period). - defaultBulkSyncGracePeriod = 10 -- seconds + defaultBlockFetchGracePeriod = 10 -- seconds -- LoP parameters. Empirically, it takes less than 1ms to validate a header, -- so leaking one token per 2ms is conservative. The capacity of 100_000 @@ -153,11 +153,11 @@ mkGenesisConfig (Just GenesisConfigFlags{..}) = -- Limiting the performance impact of the GDD. defaultGDDRateLimit = 1.0 -- seconds - gbfcBulkSyncGracePeriod = fromInteger $ fromMaybe defaultBulkSyncGracePeriod gcfBulkSyncGracePeriod - csbcCapacity = fromInteger $ fromMaybe defaultCapacity gcfBucketCapacity - csbcRate = fromInteger $ fromMaybe defaultRate gcfBucketRate - csjcJumpSize = fromInteger $ fromMaybe defaultCSJJumpSize gcfCSJJumpSize - lgpGDDRateLimit = fromMaybe defaultGDDRateLimit gcfGDDRateLimit + gbfcGracePeriod = fromInteger $ fromMaybe defaultBlockFetchGracePeriod gcfBlockFetchGracePeriod + csbcCapacity = fromInteger $ fromMaybe defaultCapacity gcfBucketCapacity + csbcRate = fromInteger $ fromMaybe defaultRate gcfBucketRate + csjcJumpSize = fromInteger $ fromMaybe defaultCSJJumpSize gcfCSJJumpSize + lgpGDDRateLimit = fromMaybe defaultGDDRateLimit gcfGDDRateLimit newtype LoEAndGDDParams = LoEAndGDDParams { -- | How often to evaluate GDD. 0 means as soon as possible. diff --git a/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/NodeKernel.hs b/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/NodeKernel.hs index 075290ec69..c65159737c 100644 --- a/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/NodeKernel.hs +++ b/ouroboros-consensus-diffusion/src/ouroboros-consensus-diffusion/Ouroboros/Consensus/NodeKernel.hs @@ -95,6 +95,7 @@ import Ouroboros.Network.AnchoredFragment (AnchoredFragment, import qualified Ouroboros.Network.AnchoredFragment as AF import Ouroboros.Network.Block (castTip, tipFromHeader) import Ouroboros.Network.BlockFetch +import Ouroboros.Network.ConsensusMode (ConsensusMode (..)) import Ouroboros.Network.Diffusion (PublicPeerSelectionState) import Ouroboros.Network.NodeToNode (ConnectionId, MiniProtocolParameters (..)) @@ -378,6 +379,7 @@ initInternalState NodeKernelArgs { tracers, chainDB, registry, cfg , mempoolCapacityOverride , gsmArgs, getUseBootstrapPeers , getDiffusionPipeliningSupport + , genesisArgs } = do varGsmState <- do let GsmNodeKernelArgs {..} = gsmArgs @@ -398,6 +400,7 @@ initInternalState NodeKernelArgs { tracers, chainDB, registry, cfg slotForgeTimeOracle <- BlockFetchClientInterface.initSlotForgeTimeOracle cfg chainDB let readFetchMode = BlockFetchClientInterface.readFetchModeDefault + (toConsensusMode $ gnkaLoEAndGDDArgs genesisArgs) btime (ChainDB.getCurrentChain chainDB) getUseBootstrapPeers @@ -416,6 +419,11 @@ initInternalState NodeKernelArgs { tracers, chainDB, registry, cfg peerSharingRegistry <- newPeerSharingRegistry return IS {..} + where + toConsensusMode :: forall a. LoEAndGDDConfig a -> ConsensusMode + toConsensusMode = \case + LoEAndGDDDisabled -> PraosMode + LoEAndGDDEnabled _ -> GenesisMode forkBlockForging :: forall m addrNTN addrNTC blk. diff --git a/ouroboros-consensus-diffusion/src/unstable-diffusion-testlib/Test/ThreadNet/Network.hs b/ouroboros-consensus-diffusion/src/unstable-diffusion-testlib/Test/ThreadNet/Network.hs index cd57825c17..d7dd9e75cc 100644 --- a/ouroboros-consensus-diffusion/src/unstable-diffusion-testlib/Test/ThreadNet/Network.hs +++ b/ouroboros-consensus-diffusion/src/unstable-diffusion-testlib/Test/ThreadNet/Network.hs @@ -1013,10 +1013,11 @@ runThreadNetwork systemTime ThreadNetworkArgs txSubmissionMaxUnacked = 1000 -- TODO ? } , blockFetchConfiguration = BlockFetchConfiguration { - bfcMaxConcurrencyDeadline = 2 + bfcMaxConcurrencyBulkSync = 1 + , bfcMaxConcurrencyDeadline = 2 , bfcMaxRequestsInflight = 10 - , bfcDecisionLoopIntervalBulkSync = 0.0 -- Mock testsuite can use sub-second slot - , bfcDecisionLoopIntervalDeadline = 0.0 -- interval which doesn't play nice with + , bfcDecisionLoopIntervalPraos = 0.0 -- Mock testsuite can use sub-second slot + , bfcDecisionLoopIntervalGenesis = 0.0 -- interval which doesn't play nice with -- blockfetch descision interval. , bfcSalt = 0 , bfcGenesisBFConfig = gcBlockFetchConfig enableGenesisConfigDefault diff --git a/ouroboros-consensus-diffusion/test/consensus-test/Test/Consensus/PeerSimulator/BlockFetch.hs b/ouroboros-consensus-diffusion/test/consensus-test/Test/Consensus/PeerSimulator/BlockFetch.hs index f317456254..b7319b8eaf 100644 --- a/ouroboros-consensus-diffusion/test/consensus-test/Test/Consensus/PeerSimulator/BlockFetch.hs +++ b/ouroboros-consensus-diffusion/test/consensus-test/Test/Consensus/PeerSimulator/BlockFetch.hs @@ -37,10 +37,12 @@ import Ouroboros.Consensus.Storage.ChainDB.API import Ouroboros.Consensus.Util (ShowProxy) import Ouroboros.Consensus.Util.IOLike import Ouroboros.Network.BlockFetch (BlockFetchConfiguration (..), - FetchClientRegistry, FetchMode (..), - GenesisBlockFetchConfiguration (..), blockFetchLogic, - bracketFetchClient, bracketKeepAliveClient) + FetchClientRegistry, GenesisBlockFetchConfiguration (..), + blockFetchLogic, bracketFetchClient, + bracketKeepAliveClient) import Ouroboros.Network.BlockFetch.Client (blockFetchClient) +import Ouroboros.Network.BlockFetch.ConsensusInterface + (FetchMode (..)) import Ouroboros.Network.Channel (Channel) import Ouroboros.Network.ControlMessage (ControlMessageSTM) import Ouroboros.Network.Driver (runPeer) @@ -93,13 +95,13 @@ startBlockFetchLogic enableChainSelStarvation registry tracer chainDb fetchClien -- do not serialize the blocks. (\_hdr -> 1000) slotForgeTime - -- This is a syncing test, so we use 'FetchModeBulkSync'. - (pure FetchModeBulkSync) + -- This is a syncing test, so we use 'FetchModeGenesis'. + (pure FetchModeGenesis) DiffusionPipeliningOn bfcGenesisBFConfig = if enableChainSelStarvation then GenesisBlockFetchConfiguration - { gbfcBulkSyncGracePeriod = + { gbfcGracePeriod = if enableChainSelStarvation then 10 -- default value for cardano-node at the time of writing else @@ -110,10 +112,11 @@ startBlockFetchLogic enableChainSelStarvation registry tracer chainDb fetchClien -- Values taken from -- ouroboros-consensus-diffusion/src/unstable-diffusion-testlib/Test/ThreadNet/Network.hs blockFetchCfg = BlockFetchConfiguration - { bfcMaxConcurrencyDeadline = 50 -- unused because of @pure FetchModeBulkSync@ above + { bfcMaxConcurrencyBulkSync = 50 + , bfcMaxConcurrencyDeadline = 50 -- unused because of @pure FetchModeBulkSync@ above , bfcMaxRequestsInflight = 10 - , bfcDecisionLoopIntervalBulkSync = 0 - , bfcDecisionLoopIntervalDeadline = 0 + , bfcDecisionLoopIntervalPraos = 0 + , bfcDecisionLoopIntervalGenesis = 0 , bfcSalt = 0 , bfcGenesisBFConfig } diff --git a/ouroboros-consensus/src/ouroboros-consensus/Ouroboros/Consensus/MiniProtocol/BlockFetch/ClientInterface.hs b/ouroboros-consensus/src/ouroboros-consensus/Ouroboros/Consensus/MiniProtocol/BlockFetch/ClientInterface.hs index 0834b5d57f..7748ab7ac7 100644 --- a/ouroboros-consensus/src/ouroboros-consensus/Ouroboros/Consensus/MiniProtocol/BlockFetch/ClientInterface.hs +++ b/ouroboros-consensus/src/ouroboros-consensus/Ouroboros/Consensus/MiniProtocol/BlockFetch/ClientInterface.hs @@ -46,7 +46,8 @@ import Ouroboros.Network.Block (MaxSlotNo) import Ouroboros.Network.BlockFetch.ConsensusInterface (BlockFetchConsensusInterface (..), ChainSelStarvation (..), FetchMode (..), - FromConsensus (..)) + FromConsensus (..), PraosFetchMode (..), mkReadFetchMode) +import Ouroboros.Network.ConsensusMode (ConsensusMode) import Ouroboros.Network.PeerSelection.Bootstrap (UseBootstrapPeers, requiresBootstrapPeers) import Ouroboros.Network.PeerSelection.LedgerPeers.Type @@ -142,37 +143,41 @@ initSlotForgeTimeOracle cfg chainDB = do readFetchModeDefault :: (MonadSTM m, HasHeader blk) - => BlockchainTime m + => ConsensusMode + -> BlockchainTime m -> STM m (AnchoredFragment blk) -> STM m UseBootstrapPeers -> STM m LedgerStateJudgement -> STM m FetchMode -readFetchModeDefault btime getCurrentChain - getUseBootstrapPeers getLedgerStateJudgement = do - mCurSlot <- getCurrentSlot btime - usingBootstrapPeers <- requiresBootstrapPeers <$> getUseBootstrapPeers - <*> getLedgerStateJudgement +readFetchModeDefault consensusMode btime getCurrentChain + getUseBootstrapPeers getLedgerStateJudgement = + mkReadFetchMode consensusMode getLedgerStateJudgement praosFetchMode + where + praosFetchMode = do + mCurSlot <- getCurrentSlot btime + usingBootstrapPeers <- requiresBootstrapPeers <$> getUseBootstrapPeers + <*> getLedgerStateJudgement - -- This logic means that when the node is using bootstrap peers and is in - -- TooOld state it will always return BulkSync. Otherwise if the node - -- isn't using bootstrap peers (i.e. has them disabled it will use the old - -- logic of returning BulkSync if behind 1000 slots - case (usingBootstrapPeers, mCurSlot) of - (True, _) -> return FetchModeBulkSync - (False, CurrentSlotUnknown) -> return FetchModeBulkSync - (False, CurrentSlot curSlot) -> do - curChainSlot <- AF.headSlot <$> getCurrentChain - let slotsBehind = case curChainSlot of - -- There's nothing in the chain. If the current slot is 0, then - -- we're 1 slot behind. - Origin -> unSlotNo curSlot + 1 - NotOrigin slot -> unSlotNo curSlot - unSlotNo slot - maxSlotsBehind = 1000 - return $ if slotsBehind < maxSlotsBehind - -- When the current chain is near to "now", use deadline mode, - -- when it is far away, use bulk sync mode. - then FetchModeDeadline - else FetchModeBulkSync + -- This logic means that when the node is using bootstrap peers and is in + -- TooOld state it will always return BulkSync. Otherwise if the node + -- isn't using bootstrap peers (i.e. has them disabled it will use the old + -- logic of returning BulkSync if behind 1000 slots + case (usingBootstrapPeers, mCurSlot) of + (True, _) -> return FetchModeBulkSync + (False, CurrentSlotUnknown) -> return FetchModeBulkSync + (False, CurrentSlot curSlot) -> do + curChainSlot <- AF.headSlot <$> getCurrentChain + let slotsBehind = case curChainSlot of + -- There's nothing in the chain. If the current slot is 0, then + -- we're 1 slot behind. + Origin -> unSlotNo curSlot + 1 + NotOrigin slot -> unSlotNo curSlot - unSlotNo slot + maxSlotsBehind = 1000 + return $ if slotsBehind < maxSlotsBehind + -- When the current chain is near to "now", use deadline mode, + -- when it is far away, use bulk sync mode. + then FetchModeDeadline + else FetchModeBulkSync mkBlockFetchConsensusInterface :: forall m peer blk. diff --git a/ouroboros-consensus/test/consensus-test/Test/Consensus/MiniProtocol/BlockFetch/Client.hs b/ouroboros-consensus/test/consensus-test/Test/Consensus/MiniProtocol/BlockFetch/Client.hs index a3c56a3cb4..caa58f3bfc 100644 --- a/ouroboros-consensus/test/consensus-test/Test/Consensus/MiniProtocol/BlockFetch/Client.hs +++ b/ouroboros-consensus/test/consensus-test/Test/Consensus/MiniProtocol/BlockFetch/Client.hs @@ -57,6 +57,8 @@ import Ouroboros.Network.BlockFetch (BlockFetchConfiguration (..), bracketFetchClient, bracketKeepAliveClient, bracketSyncWithFetchClient, newFetchClientRegistry) import Ouroboros.Network.BlockFetch.Client (blockFetchClient) +import Ouroboros.Network.BlockFetch.ConsensusInterface + (PraosFetchMode (..)) import Ouroboros.Network.ControlMessage (ControlMessage (..)) import Ouroboros.Network.Mock.Chain (Chain) import qualified Ouroboros.Network.Mock.Chain as Chain @@ -97,8 +99,9 @@ prop_blockFetch bfcts@BlockFetchClientTestSetup{..} = [ Map.keysSet bfcoBlockFetchResults === Map.keysSet peerUpdates , counterexample ("Fetched blocks per peer: " <> condense bfcoFetchedBlocks) $ property $ case blockFetchMode of - FetchModeDeadline -> all (> 0) bfcoFetchedBlocks - FetchModeBulkSync -> any (> 0) bfcoFetchedBlocks + PraosFetchMode FetchModeDeadline -> all (> 0) bfcoFetchedBlocks + PraosFetchMode FetchModeBulkSync -> all (> 0) bfcoFetchedBlocks + FetchModeGenesis -> any (> 0) bfcoFetchedBlocks ] where BlockFetchClientOutcome{..} = runSimOrThrow $ runBlockFetchTest bfcts @@ -361,18 +364,23 @@ instance Arbitrary BlockFetchClientTestSetup where peerUpdates <- Map.fromList . zip peerIds <$> replicateM numPeers (genUpdateSchedule blockFetchPipelining) - blockFetchMode <- elements [FetchModeBulkSync, FetchModeDeadline] + blockFetchMode <- elements + [ PraosFetchMode FetchModeBulkSync + , PraosFetchMode FetchModeDeadline + , FetchModeGenesis + ] blockFetchCfg <- do let -- ensure that we can download blocks from all peers + bfcMaxConcurrencyBulkSync = fromIntegral numPeers bfcMaxConcurrencyDeadline = fromIntegral numPeers -- This is used to introduce a minimal delay between BlockFetch -- logic iterations in case the monitored state vars change too -- fast, which we don't have to worry about in this test. - bfcDecisionLoopIntervalBulkSync = 0 - bfcDecisionLoopIntervalDeadline = 0 + bfcDecisionLoopIntervalGenesis = 0 + bfcDecisionLoopIntervalPraos = 0 bfcMaxRequestsInflight <- chooseEnum (2, 10) bfcSalt <- arbitrary - gbfcBulkSyncGracePeriod <- fromIntegral <$> chooseInteger (5, 60) + gbfcGracePeriod <- fromIntegral <$> chooseInteger (5, 60) let bfcGenesisBFConfig = GenesisBlockFetchConfiguration {..} pure BlockFetchConfiguration {..} pure BlockFetchClientTestSetup {..}