Skip to content

Commit

Permalink
Support for big ledger peer snapshot
Browse files Browse the repository at this point in the history
This change introduces support for big ledger peers in the node.
A new optional entry in network topology JSON parser is added that is intended
to point to a path containing a serialized snapshot of big ledger peers
taken from some slot a priori. When present, this file is decoded
at node startup, or when a SIGHUP is triggered, and made available
to the diffusion layer via reading from a TVar.
  • Loading branch information
crocodile-dentist committed Apr 22, 2024
1 parent 0cc5b08 commit c10e12e
Show file tree
Hide file tree
Showing 8 changed files with 111 additions and 18 deletions.
5 changes: 5 additions & 0 deletions cardano-node/ChangeLog.md
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,11 @@
## Next version

- Use p2p network stack by default, warn when using the legacy network stack.
- Ledger peer snapshot path entry added to topology JSON parser,
which a new decoder function `readPeerSnapshotFile` processes
at startup and SIGHUP. Data is available to the diffusion layer
via TVar.


## 8.2.1 -- August 2023

Expand Down
1 change: 1 addition & 0 deletions cardano-node/cardano-node.cabal
Original file line number Diff line number Diff line change
Expand Up @@ -145,6 +145,7 @@ library
, base16-bytestring
, bytestring
, cardano-api ^>= 8.44
, cardano-binary
, cardano-crypto-class
, cardano-crypto-wrapper
, cardano-git-rev ^>=0.2.2
Expand Down
29 changes: 25 additions & 4 deletions cardano-node/src/Cardano/Node/Configuration/TopologyP2P.hs
Original file line number Diff line number Diff line change
Expand Up @@ -18,11 +18,13 @@ module Cardano.Node.Configuration.TopologyP2P
, PeerAdvertise(..)
, nodeAddressToSockAddr
, readTopologyFile
, readPeerSnapshotFile
, readTopologyFileOrError
, rootConfigToRelayAccessPoint
)
where

import Cardano.Binary
import Cardano.Node.Configuration.NodeAddress
import Cardano.Node.Configuration.POM (NodeConfiguration (..))
import Cardano.Node.Configuration.Topology (TopologyError (..))
Expand All @@ -31,16 +33,20 @@ import Cardano.Node.Types
import Cardano.Tracing.OrphanInstances.Network ()
import Ouroboros.Network.NodeToNode (PeerAdvertise (..))
import Ouroboros.Network.PeerSelection.Bootstrap (UseBootstrapPeers (..))
import Ouroboros.Network.PeerSelection.LedgerPeers.Type (UseLedgerPeers (..))
import Ouroboros.Network.PeerSelection.LedgerPeers.Type (LedgerPeerSnapshot (..),
UseLedgerPeers (..))
import Ouroboros.Network.PeerSelection.PeerTrustable (PeerTrustable (..))
import Ouroboros.Network.PeerSelection.RelayAccessPoint (RelayAccessPoint (..))
import Ouroboros.Network.PeerSelection.State.LocalRootPeers (HotValency (..),
WarmValency (..))

import Codec.CBOR.Read
import Control.Applicative (Alternative (..))
import Control.DeepSeq
import Control.Exception (IOException)
import qualified Control.Exception as Exception
import Control.Exception.Base (Exception (..))
import Control.Monad.Trans.Except.Extra
import "contra-tracer" Control.Tracer (Tracer, traceWith)
import Data.Aeson
import Data.Bifunctor (Bifunctor (..))
Expand Down Expand Up @@ -175,6 +181,7 @@ data NetworkTopology = RealNodeTopology { ntLocalRootPeersGroups :: !LocalRootPe
, ntPublicRootPeers :: ![PublicRootPeers]
, ntUseLedgerPeers :: !UseLedgerPeers
, ntUseBootstrapPeers :: !UseBootstrapPeers
, ntPeerSnapshotPath :: !(Maybe PeerSnapshotFile)
}
deriving (Eq, Show)

Expand All @@ -183,7 +190,8 @@ instance FromJSON NetworkTopology where
RealNodeTopology <$> (o .: "localRoots" )
<*> (o .: "publicRoots" )
<*> (o .:? "useLedgerAfterSlot" .!= DontUseLedgerPeers )
<*> (o .:? "bootstrapPeers" .!= DontUseBootstrapPeers)
<*> (o .:? "bootstrapPeers" .!= DontUseBootstrapPeers )
<*> (o .:? "peerSnapshotFile")

instance ToJSON NetworkTopology where
toJSON top =
Expand All @@ -192,10 +200,12 @@ instance ToJSON NetworkTopology where
, ntPublicRootPeers
, ntUseLedgerPeers
, ntUseBootstrapPeers
, ntPeerSnapshotPath
} -> object [ "localRoots" .= ntLocalRootPeersGroups
, "publicRoots" .= ntPublicRootPeers
, "useLedgerAfterSlot" .= ntUseLedgerPeers
, "bootstrapPeers" .= ntUseBootstrapPeers
, "peerSnapshotFile" .= ntPeerSnapshotPath
]

--
Expand Down Expand Up @@ -235,7 +245,8 @@ instance FromJSON (Legacy NetworkTopology) where
RealNodeTopology <$> fmap getLegacy (o .: "LocalRoots")
<*> fmap getLegacy (o .: "PublicRoots")
<*> (o .:? "useLedgerAfterSlot" .!= DontUseLedgerPeers)
<*> pure DontUseBootstrapPeers)
<*> pure DontUseBootstrapPeers
<*> pure Nothing)

-- | Read the `NetworkTopology` configuration from the specified file.
--
Expand Down Expand Up @@ -297,14 +308,24 @@ readTopologyFileOrError tr nc =
<> Text.unpack err)
pure

readPeerSnapshotFile :: PeerSnapshotFile -> IO LedgerPeerSnapshot
readPeerSnapshotFile (PeerSnapshotFile psf) = either error pure =<< runExceptT
(handleLeftT (left . ("Cardano.Node.Configuration.TopologyP2P.readPeerSnapshotFile: " <>)) $ do
contents <- BS.readFile psf `catchIOExceptT` displayException
-- sweep it out eagerly
let tryDecode = force . deserialiseFromBytes fromCBOR . LBS.fromStrict $ contents
case tryDecode of
Left _ -> left "Peer snapshot file read but decode failed - incompatible or corrupted file?"
Right (_, lps) -> right lps)

--
-- Checking for chance of progress in bootstrap phase
--

-- | This function returns false if non-trustable peers are configured
--
isValidTrustedPeerConfiguration :: NetworkTopology -> Bool
isValidTrustedPeerConfiguration (RealNodeTopology (LocalRootPeersGroups lprgs) _ _ ubp) =
isValidTrustedPeerConfiguration (RealNodeTopology (LocalRootPeersGroups lprgs) _ _ ubp _) =
case ubp of
DontUseBootstrapPeers -> True
UseBootstrapPeers [] -> anyTrustable
Expand Down
57 changes: 46 additions & 11 deletions cardano-node/src/Cardano/Node/Run.hs
Original file line number Diff line number Diff line change
Expand Up @@ -8,8 +8,8 @@
{-# LANGUAGE NamedFieldPuns #-}
{-# LANGUAGE PackageImports #-}
{-# LANGUAGE ScopedTypeVariables #-}
{-# LANGUAGE TypeApplications #-}
{-# LANGUAGE TupleSections #-}
{-# LANGUAGE TypeApplications #-}

{-# OPTIONS_GHC -Wno-unused-imports #-}

Expand All @@ -34,7 +34,7 @@ import Control.Concurrent (killThread, mkWeakThreadId, myThreadId)
import Control.Concurrent.Class.MonadSTM.Strict
import Control.Exception (try)
import qualified Control.Exception as Exception
import Control.Monad (forM_, unless, void, when)
import Control.Monad (forM, forM_, unless, void, when)
import Control.Monad.Class.MonadThrow (MonadThrow (..))
import Control.Monad.IO.Class (MonadIO (..))
import Control.Monad.Trans.Except (ExceptT, runExceptT)
Expand Down Expand Up @@ -125,7 +125,7 @@ import Cardano.Node.TraceConstraints (TraceConstraints)
import Cardano.Tracing.Tracers
import Ouroboros.Network.PeerSelection.PeerSharing (PeerSharing (..))
import Ouroboros.Network.PeerSelection.State.LocalRootPeers (HotValency, WarmValency)
import Ouroboros.Network.PeerSelection.LedgerPeers.Type (UseLedgerPeers)
import Ouroboros.Network.PeerSelection.LedgerPeers.Type (LedgerPeerSnapshot (..), UseLedgerPeers)
import Ouroboros.Network.PeerSelection.PeerTrustable (PeerTrustable)
import Ouroboros.Network.PeerSelection.Bootstrap (UseBootstrapPeers)

Expand Down Expand Up @@ -420,16 +420,24 @@ handleSimpleNode blockType runP p2pMode tracers nc onKernel = do
nt@TopologyP2P.RealNodeTopology
{ ntUseLedgerPeers
, ntUseBootstrapPeers
, ntPeerSnapshotPath
} <- TopologyP2P.readTopologyFileOrError (startupTracer tracers) nc
let (localRoots, publicRoots) = producerAddresses nt
traceWith (startupTracer tracers)
$ NetworkConfig localRoots
publicRoots
ntUseLedgerPeers
localRootsVar <- newTVarIO localRoots
publicRootsVar <- newTVarIO publicRoots
useLedgerVar <- newTVarIO ntUseLedgerPeers
ntPeerSnapshotPath
localRootsVar <- newTVarIO localRoots
publicRootsVar <- newTVarIO publicRoots
useLedgerVar <- newTVarIO ntUseLedgerPeers
useBootstrapVar <- newTVarIO ntUseBootstrapPeers
ledgerPeerSnapshotPathVar <- newTVarIO ntPeerSnapshotPath
ledgerPeerSnapshotVar <- newTVarIO =<< updateLedgerPeerSnapshot
(startupTracer tracers)
(readTVar ledgerPeerSnapshotPathVar)
(const . pure $ ())

let nodeArgs = RunNodeArgs
{ rnTraceConsensus = consensusTracers tracers
, rnTraceNTN = nodeToNodeTracers tracers
Expand Down Expand Up @@ -462,6 +470,11 @@ handleSimpleNode blockType runP p2pMode tracers nc onKernel = do
updateTopologyConfiguration
(startupTracer tracers) nc
localRootsVar publicRootsVar useLedgerVar useBootstrapVar
ledgerPeerSnapshotPathVar
void $ updateLedgerPeerSnapshot
(startupTracer tracers)
(readTVar ledgerPeerSnapshotPathVar)
(writeTVar ledgerPeerSnapshotVar)
traceWith (startupTracer tracers) (BlockForgingUpdate NotEffective)
)
Nothing
Expand All @@ -473,13 +486,15 @@ handleSimpleNode blockType runP p2pMode tracers nc onKernel = do
(readTVar publicRootsVar)
(readTVar useLedgerVar)
(readTVar useBootstrapVar)
(readTVar ledgerPeerSnapshotVar)
in
Node.run
nodeArgs {
rnNodeKernelHook = \registry nodeKernel -> do
-- reinstall `SIGHUP` handler
installP2PSigHUPHandler (startupTracer tracers) blockType nc nodeKernel
localRootsVar publicRootsVar useLedgerVar useBootstrapVar
ledgerPeerSnapshotPathVar
rnNodeKernelHook nodeArgs registry nodeKernel
}
StdRunNodeArgs
Expand Down Expand Up @@ -648,17 +663,19 @@ installP2PSigHUPHandler :: Tracer IO (StartupTrace blk)
-> StrictTVar IO (Map RelayAccessPoint PeerAdvertise)
-> StrictTVar IO UseLedgerPeers
-> StrictTVar IO UseBootstrapPeers
-> StrictTVar IO (Maybe PeerSnapshotFile)
-> IO ()
#ifndef UNIX
installP2PSigHUPHandler _ _ _ _ _ _ _ _ = return ()
#else
installP2PSigHUPHandler startupTracer blockType nc nodeKernel localRootsVar publicRootsVar useLedgerVar
useBootstrapPeersVar =
useBootstrapPeersVar ledgerPeerSnapshotPathVar =
void $ Signals.installHandler
Signals.sigHUP
(Signals.Catch $ do
updateBlockForging startupTracer blockType nodeKernel nc
updateTopologyConfiguration startupTracer nc localRootsVar publicRootsVar useLedgerVar useBootstrapPeersVar
updateTopologyConfiguration startupTracer nc localRootsVar publicRootsVar
useLedgerVar useBootstrapPeersVar ledgerPeerSnapshotPathVar
)
Nothing
#endif
Expand Down Expand Up @@ -743,9 +760,10 @@ updateTopologyConfiguration :: Tracer IO (StartupTrace blk)
-> StrictTVar IO (Map RelayAccessPoint PeerAdvertise)
-> StrictTVar IO UseLedgerPeers
-> StrictTVar IO UseBootstrapPeers
-> StrictTVar IO (Maybe PeerSnapshotFile)
-> IO ()
updateTopologyConfiguration startupTracer nc localRootsVar publicRootsVar useLedgerVar
useBootsrapPeersVar = do
useBootsrapPeersVar ledgerPeerSnapshotPathVar = do
traceWith startupTracer NetworkConfigUpdate
result <- try $ readTopologyFileOrError startupTracer nc
case result of
Expand All @@ -755,17 +773,31 @@ updateTopologyConfiguration startupTracer nc localRootsVar publicRootsVar useLed
$ pack "Error reading topology configuration file:" <> err
Right nt@RealNodeTopology { ntUseLedgerPeers
, ntUseBootstrapPeers
, ntPeerSnapshotPath
} -> do
let (localRoots, publicRoots) = producerAddresses nt
traceWith startupTracer
$ NetworkConfig localRoots publicRoots ntUseLedgerPeers
$ NetworkConfig localRoots publicRoots ntUseLedgerPeers ntPeerSnapshotPath
atomically $ do
writeTVar localRootsVar localRoots
writeTVar publicRootsVar publicRoots
writeTVar useLedgerVar ntUseLedgerPeers
writeTVar useBootsrapPeersVar ntUseBootstrapPeers
writeTVar ledgerPeerSnapshotPathVar ntPeerSnapshotPath
#endif

updateLedgerPeerSnapshot :: Tracer IO (StartupTrace blk)
-> STM IO (Maybe PeerSnapshotFile)
-> (Maybe LedgerPeerSnapshot -> STM IO ())
-> IO (Maybe LedgerPeerSnapshot)
updateLedgerPeerSnapshot startupTracer readLedgerPeerPath writeVar = do
mPeerSnapshotFile <- atomically readLedgerPeerPath
mLedgerPeerSnapshot <- forM mPeerSnapshotFile $ \f -> do
lps@(LedgerPeerSnapshot (wOrigin, _)) <- readPeerSnapshotFile f
lps <$ traceWith startupTracer (LedgerPeerSnapshotLoaded wOrigin)
atomically . writeVar $ mLedgerPeerSnapshot
pure mLedgerPeerSnapshot

--------------------------------------------------------------------------------
-- Helper functions
--------------------------------------------------------------------------------
Expand Down Expand Up @@ -823,6 +855,7 @@ mkP2PArguments
-> STM IO (Map RelayAccessPoint PeerAdvertise)
-> STM IO UseLedgerPeers
-> STM IO UseBootstrapPeers
-> STM IO (Maybe LedgerPeerSnapshot)
-> Diffusion.ExtraArguments 'Diffusion.P2P IO
mkP2PArguments NodeConfiguration {
ncTargetNumberOfRootPeers,
Expand All @@ -839,13 +872,15 @@ mkP2PArguments NodeConfiguration {
daReadLocalRootPeers
daReadPublicRootPeers
daReadUseLedgerPeers
daReadUseBootstrapPeers =
daReadUseBootstrapPeers
daReadLedgerPeerSnapshot =
Diffusion.P2PArguments P2P.ArgumentsExtra
{ P2P.daPeerSelectionTargets
, P2P.daReadLocalRootPeers
, P2P.daReadPublicRootPeers
, P2P.daReadUseLedgerPeers
, P2P.daReadUseBootstrapPeers
, P2P.daReadLedgerPeerSnapshot
, P2P.daProtocolIdleTimeout = ncProtocolIdleTimeout
, P2P.daTimeWaitTimeout = ncTimeWaitTimeout
, P2P.daDeadlineChurnInterval = 3300
Expand Down
4 changes: 4 additions & 0 deletions cardano-node/src/Cardano/Node/Startup.hs
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,8 @@ import Cardano.Node.Configuration.POM (NodeConfiguration (..), ncProto
import Cardano.Node.Configuration.Socket
import Cardano.Node.Protocol (ProtocolInstantiationError)
import Cardano.Node.Protocol.Types (SomeConsensusProtocol (..))
import Cardano.Node.Types (PeerSnapshotFile)
import Cardano.Slotting.Slot (SlotNo, WithOrigin)
import qualified Ouroboros.Consensus.BlockchainTime.WallClock.Types as WCT
import Ouroboros.Consensus.Cardano.Block
import Ouroboros.Consensus.Cardano.CanHardFork (shelleyLedgerConfig)
Expand Down Expand Up @@ -113,6 +115,7 @@ data StartupTrace blk =
| NetworkConfig [(HotValency, WarmValency, Map RelayAccessPoint (PeerAdvertise, PeerTrustable))]
(Map RelayAccessPoint PeerAdvertise)
UseLedgerPeers
(Maybe PeerSnapshotFile)

-- | Warn when 'DisabledP2P' is set.
| NonP2PWarning
Expand All @@ -131,6 +134,7 @@ data StartupTrace blk =
| BIShelley BasicInfoShelleyBased
| BIByron BasicInfoByron
| BINetwork BasicInfoNetwork
| LedgerPeerSnapshotLoaded (WithOrigin SlotNo)

data EnabledBlockForging = EnabledBlockForging
| DisabledBlockForging
Expand Down
Loading

0 comments on commit c10e12e

Please sign in to comment.