20 #ifndef RIPPLE_CONSENSUS_CONSENSUS_H_INCLUDED
21 #define RIPPLE_CONSENSUS_CONSENSUS_H_INCLUDED
23 #include <ripple/basics/Log.h>
24 #include <ripple/basics/chrono.h>
25 #include <ripple/beast/utility/Journal.h>
26 #include <ripple/consensus/ConsensusParms.h>
27 #include <ripple/consensus/ConsensusProposal.h>
28 #include <ripple/consensus/ConsensusTypes.h>
29 #include <ripple/consensus/DisputedTx.h>
30 #include <ripple/consensus/LedgerTiming.h>
31 #include <ripple/json/json_writer.h>
32 #include <boost/logic/tribool.hpp>
69 ConsensusParms
const& parms,
94 ConsensusParms
const& parms,
286 template <
class Adaptor>
292 using Tx_t =
typename TxSet_t::Tx;
296 typename Ledger_t::ID,
297 typename TxSet_t::ID>;
320 a.onModeChange(
mode_, mode);
405 std::optional<
std::chrono::milliseconds> consensusDelay);
607 template <
class Adaptor>
612 : adaptor_(adaptor), clock_(clock), j_{journal}
614 JLOG(j_.
debug()) <<
"Creating consensus object";
617 template <
class Adaptor>
621 typename Ledger_t::ID
const& prevLedgerID,
629 prevRoundTime_ = adaptor_.parms().ledgerIDLE_INTERVAL;
630 prevCloseTime_ = prevLedger.closeTime();
635 prevCloseTime_ = rawCloseTimes_.self;
638 for (
NodeID_t const& n : nowUntrusted)
639 recentPeerPositions_.erase(n);
642 proposing ? ConsensusMode::proposing : ConsensusMode::observing;
645 if (prevLedger.id() != prevLedgerID)
648 if (
auto newLedger = adaptor_.acquireLedger(prevLedgerID))
650 prevLedger = *newLedger;
654 startMode = ConsensusMode::wrongLedger;
656 <<
"Entering consensus with: " << previousLedger_.id();
657 JLOG(j_.
info()) <<
"Correct LCL is: " << prevLedgerID;
661 startRoundInternal(now, prevLedgerID, prevLedger, startMode);
663 template <
class Adaptor>
667 typename Ledger_t::ID
const& prevLedgerID,
671 phase_ = ConsensusPhase::open;
672 JLOG(j_.
debug()) <<
"transitioned to ConsensusPhase::open";
673 mode_.set(mode, adaptor_);
675 prevLedgerID_ = prevLedgerID;
676 previousLedger_ = prevLedger;
678 convergePercent_ = 0;
679 haveCloseTimeConsensus_ =
false;
680 openTime_.reset(clock_.now());
681 currPeerPositions_.clear();
683 rawCloseTimes_.peers.clear();
684 rawCloseTimes_.self = {};
688 previousLedger_.closeTimeResolution(),
689 previousLedger_.closeAgree(),
690 previousLedger_.seq() +
typename Ledger_t::Seq{1});
693 if (currPeerPositions_.size() > (prevProposers_ / 2))
701 template <
class Adaptor>
707 auto const& peerID = newPeerPos.proposal().nodeID();
711 auto& props = recentPeerPositions_[peerID];
713 if (props.size() >= 10)
716 props.push_back(newPeerPos);
718 return peerProposalInternal(now, newPeerPos);
721 template <
class Adaptor>
728 if (phase_ == ConsensusPhase::accepted)
733 auto const& newPeerProp = newPeerPos.proposal();
735 if (newPeerProp.prevLedger() != prevLedgerID_)
737 JLOG(j_.
debug()) <<
"Got proposal for " << newPeerProp.prevLedger()
738 <<
" but we are on " << prevLedgerID_;
742 auto const& peerID = newPeerProp.nodeID();
744 if (deadNodes_.find(peerID) != deadNodes_.end())
746 JLOG(j_.
info()) <<
"Position from dead node: " << peerID;
752 auto peerPosIt = currPeerPositions_.find(peerID);
754 if (peerPosIt != currPeerPositions_.end())
756 if (newPeerProp.proposeSeq() <=
757 peerPosIt->second.proposal().proposeSeq())
763 if (newPeerProp.isBowOut())
765 JLOG(j_.
info()) <<
"Peer " << peerID <<
" bows out";
768 for (
auto& it : result_->disputes)
769 it.second.unVote(peerID);
771 if (peerPosIt != currPeerPositions_.end())
772 currPeerPositions_.erase(peerID);
773 deadNodes_.insert(peerID);
778 if (peerPosIt != currPeerPositions_.end())
779 peerPosIt->second = newPeerPos;
781 currPeerPositions_.emplace(peerID, newPeerPos);
784 if (newPeerProp.isInitial())
787 JLOG(j_.
trace()) <<
"Peer reports close time as "
788 << newPeerProp.closeTime().time_since_epoch().count();
789 ++rawCloseTimes_.peers[newPeerProp.closeTime()];
792 JLOG(j_.
trace()) <<
"Processing peer proposal " << newPeerProp.proposeSeq()
793 <<
"/" << newPeerProp.position();
796 auto const ait = acquired_.find(newPeerProp.position());
797 if (ait == acquired_.end())
802 if (
auto set = adaptor_.acquireTxSet(newPeerProp.position()))
803 gotTxSet(now_, *
set);
805 JLOG(j_.
debug()) <<
"Don't have tx set for peer";
809 updateDisputes(newPeerProp.nodeID(), ait->second);
816 template <
class Adaptor>
821 if (phase_ == ConsensusPhase::accepted)
829 if (phase_ == ConsensusPhase::open)
833 else if (phase_ == ConsensusPhase::establish)
839 template <
class Adaptor>
846 if (phase_ == ConsensusPhase::accepted)
851 auto id = txSet.id();
855 if (!acquired_.emplace(
id, txSet).second)
860 JLOG(j_.
debug()) <<
"Not creating disputes: no position yet.";
866 assert(
id != result_->position.position());
868 for (
auto const& [nodeId, peerPos] : currPeerPositions_)
870 if (peerPos.proposal().position() ==
id)
872 updateDisputes(nodeId, txSet);
880 <<
"By the time we got " <<
id <<
" no peers were proposing it";
885 template <
class Adaptor>
891 using namespace std::chrono_literals;
892 JLOG(j_.
info()) <<
"Simulating consensus";
895 result_->roundTime.tick(consensusDelay.
value_or(100ms));
896 result_->proposers = prevProposers_ = currPeerPositions_.size();
897 prevRoundTime_ = result_->roundTime.read();
898 phase_ = ConsensusPhase::accepted;
899 adaptor_.onForceAccept(
906 JLOG(j_.
info()) <<
"Simulation complete";
909 template <
class Adaptor>
918 ret[
"proposing"] = (mode_.get() == ConsensusMode::proposing);
919 ret[
"proposers"] =
static_cast<int>(currPeerPositions_.size());
921 if (mode_.get() != ConsensusMode::wrongLedger)
923 ret[
"synched"] =
true;
926 ret[
"close_granularity"] =
static_cast<Int
>(closeResolution_.count());
929 ret[
"synched"] =
false;
931 ret[
"phase"] = to_string(phase_);
933 if (result_ && !result_->disputes.empty() && !full)
934 ret[
"disputes"] =
static_cast<Int
>(result_->disputes.size());
937 ret[
"our_position"] = result_->position.getJson();
943 static_cast<Int
>(result_->roundTime.read().count());
944 ret[
"converge_percent"] = convergePercent_;
945 ret[
"close_resolution"] =
static_cast<Int
>(closeResolution_.count());
946 ret[
"have_time_consensus"] = haveCloseTimeConsensus_;
947 ret[
"previous_proposers"] =
static_cast<Int
>(prevProposers_);
948 ret[
"previous_mseconds"] =
static_cast<Int
>(prevRoundTime_.count());
950 if (!currPeerPositions_.empty())
954 for (
auto const& [nodeId, peerPos] : currPeerPositions_)
956 ppj[to_string(nodeId)] = peerPos.getJson();
958 ret[
"peer_positions"] = std::move(ppj);
961 if (!acquired_.empty())
964 for (
auto const& at : acquired_)
966 acq.
append(to_string(at.first));
968 ret[
"acquired"] = std::move(acq);
971 if (result_ && !result_->disputes.empty())
974 for (
auto const& [txId, dispute] : result_->disputes)
976 dsj[to_string(txId)] = dispute.getJson();
978 ret[
"disputes"] = std::move(dsj);
981 if (!rawCloseTimes_.peers.empty())
984 for (
auto const& ct : rawCloseTimes_.peers)
989 ret[
"close_times"] = std::move(ctj);
992 if (!deadNodes_.empty())
995 for (
auto const& dn : deadNodes_)
997 dnj.
append(to_string(dn));
999 ret[
"dead_nodes"] = std::move(dnj);
1007 template <
class Adaptor>
1011 assert(lgrId != prevLedgerID_ || previousLedger_.id() != lgrId);
1017 if (prevLedgerID_ != lgrId)
1019 prevLedgerID_ = lgrId;
1024 result_->disputes.clear();
1025 result_->compares.clear();
1028 currPeerPositions_.clear();
1029 rawCloseTimes_.peers.clear();
1033 playbackProposals();
1036 if (previousLedger_.id() == prevLedgerID_)
1040 if (
auto newLedger = adaptor_.acquireLedger(prevLedgerID_))
1042 JLOG(j_.
info()) <<
"Have the consensus ledger " << prevLedgerID_;
1044 now_, lgrId, *newLedger, ConsensusMode::switchedLedger);
1048 mode_.set(ConsensusMode::wrongLedger, adaptor_);
1052 template <
class Adaptor>
1057 adaptor_.getPrevLedger(prevLedgerID_, previousLedger_, mode_.get());
1059 if (netLgr != prevLedgerID_)
1061 JLOG(j_.
warn()) <<
"View of consensus changed during "
1062 << to_string(phase_) <<
" status=" << to_string(phase_)
1064 <<
" mode=" << to_string(mode_.get());
1065 JLOG(j_.
warn()) << prevLedgerID_ <<
" to " << netLgr;
1067 JLOG(j_.
debug()) <<
"State on consensus change "
1069 handleWrongLedger(netLgr);
1071 else if (previousLedger_.id() != prevLedgerID_)
1072 handleWrongLedger(netLgr);
1075 template <
class Adaptor>
1079 for (
auto const& it : recentPeerPositions_)
1081 for (
auto const& pos : it.second)
1083 if (pos.proposal().prevLedger() == prevLedgerID_)
1085 if (peerProposalInternal(now_, pos))
1086 adaptor_.share(pos);
1092 template <
class Adaptor>
1099 bool anyTransactions = adaptor_.hasOpenTransactions();
1100 auto proposersClosed = currPeerPositions_.size();
1101 auto proposersValidated = adaptor_.proposersValidated(prevLedgerID_);
1103 openTime_.tick(clock_.now());
1108 bool previousCloseCorrect =
1109 (mode_.get() != ConsensusMode::wrongLedger) &&
1110 previousLedger_.closeAgree() &&
1111 (previousLedger_.closeTime() !=
1112 (previousLedger_.parentCloseTime() + 1s));
1114 auto lastCloseTime = previousCloseCorrect
1115 ? previousLedger_.closeTime()
1118 if (now_ >= lastCloseTime)
1119 sinceClose = duration_cast<milliseconds>(now_ - lastCloseTime);
1121 sinceClose = -duration_cast<milliseconds>(lastCloseTime - now_);
1124 auto const idleInterval = std::max<milliseconds>(
1125 adaptor_.parms().ledgerIDLE_INTERVAL,
1126 2 * previousLedger_.closeTimeResolution());
1145 template <
class Adaptor>
1149 auto const& parms = adaptor_.parms();
1151 previousLedger_.seq() -
1152 std::min(adaptor_.getValidLedgerIndex(), previousLedger_.seq()));
1153 auto [quorum, trustedKeys] = adaptor_.getQuorumKeys();
1154 std::size_t const totalValidators = trustedKeys.size();
1156 adaptor_.laggards(previousLedger_.seq(), trustedKeys);
1160 vars <<
" (working seq: " << previousLedger_.seq() <<
", "
1161 <<
"validated seq: " << adaptor_.getValidLedgerIndex() <<
", "
1162 <<
"am validator: " << adaptor_.validator() <<
", "
1163 <<
"have validated: " << adaptor_.haveValidated() <<
", "
1164 <<
"roundTime: " << result_->roundTime.
read().count() <<
", "
1165 <<
"max consensus time: " << parms.ledgerMAX_CONSENSUS.count() <<
", "
1166 <<
"validators: " << totalValidators <<
", "
1167 <<
"laggards: " << laggards <<
", "
1168 <<
"offline: " << offline <<
", "
1169 <<
"quorum: " << quorum <<
")";
1171 if (!ahead || !laggards || !totalValidators || !adaptor_.validator() ||
1172 !adaptor_.haveValidated() ||
1173 result_->roundTime.read() > parms.ledgerMAX_CONSENSUS)
1175 j_.
debug() <<
"not pausing (early)" << vars.
str();
1179 bool willPause =
false;
1215 std::size_t const phase = (ahead - 1) % (maxPausePhase + 1);
1224 if (laggards + offline > totalValidators - quorum)
1239 float const nonLaggards = totalValidators - (laggards + offline);
1240 float const quorumRatio =
1241 static_cast<float>(quorum) / totalValidators;
1242 float const allowedDissent = 1.0f - quorumRatio;
1243 float const phaseFactor =
static_cast<float>(phase) / maxPausePhase;
1245 if (nonLaggards / totalValidators <
1246 quorumRatio + (allowedDissent * phaseFactor))
1253 j_.
warn() <<
"pausing" << vars.
str();
1255 j_.
debug() <<
"not pausing" << vars.
str();
1259 template <
class Adaptor>
1269 result_->roundTime.tick(clock_.now());
1270 result_->proposers = currPeerPositions_.size();
1272 convergePercent_ = result_->roundTime.read() * 100 /
1279 updateOurPositions();
1282 if (shouldPause() || !haveConsensus())
1285 if (!haveCloseTimeConsensus_)
1287 JLOG(j_.
info()) <<
"We have TX consensus but not CT consensus";
1291 JLOG(j_.
info()) <<
"Converge cutoff (" << currPeerPositions_.size()
1292 <<
" participants)";
1293 adaptor_.updateOperatingMode(currPeerPositions_.size());
1294 prevProposers_ = currPeerPositions_.size();
1295 prevRoundTime_ = result_->roundTime.read();
1296 phase_ = ConsensusPhase::accepted;
1297 JLOG(j_.
debug()) <<
"transitioned to ConsensusPhase::accepted";
1307 template <
class Adaptor>
1314 phase_ = ConsensusPhase::establish;
1315 JLOG(j_.
debug()) <<
"transitioned to ConsensusPhase::establish";
1316 rawCloseTimes_.self = now_;
1318 result_.emplace(adaptor_.onClose(previousLedger_, now_, mode_.get()));
1319 result_->roundTime.reset(clock_.now());
1322 if (acquired_.emplace(result_->txns.id(), result_->txns).second)
1323 adaptor_.share(result_->txns);
1325 if (mode_.get() == ConsensusMode::proposing)
1326 adaptor_.propose(result_->position);
1329 for (
auto const& pit : currPeerPositions_)
1331 auto const& pos = pit.second.proposal().position();
1332 auto const it = acquired_.find(pos);
1333 if (it != acquired_.end())
1335 createDisputes(it->second);
1355 int result = ((participants * percent) + (percent / 2)) / 100;
1357 return (result == 0) ? 1 : result;
1360 template <
class Adaptor>
1375 auto it = currPeerPositions_.
begin();
1376 while (it != currPeerPositions_.end())
1378 Proposal_t const& peerProp = it->second.proposal();
1379 if (peerProp.
isStale(peerCutoff))
1383 JLOG(j_.
warn()) <<
"Removing stale proposal from " << peerID;
1384 for (
auto& dt : result_->disputes)
1385 dt.second.unVote(peerID);
1386 it = currPeerPositions_.erase(it);
1391 ++closeTimeVotes[asCloseTime(peerProp.
closeTime())];
1403 for (
auto& [txId, dispute] : result_->disputes)
1407 if (dispute.updateVote(
1409 mode_.get() == ConsensusMode::proposing,
1413 mutableSet.
emplace(result_->txns);
1415 if (dispute.getOurVote())
1418 mutableSet->insert(dispute.tx());
1423 mutableSet->erase(txId);
1429 ourNewSet.
emplace(std::move(*mutableSet));
1433 haveCloseTimeConsensus_ =
false;
1435 if (currPeerPositions_.empty())
1438 haveCloseTimeConsensus_ =
true;
1439 consensusCloseTime = asCloseTime(result_->position.closeTime());
1454 int participants = currPeerPositions_.size();
1455 if (mode_.get() == ConsensusMode::proposing)
1457 ++closeTimeVotes[asCloseTime(result_->position.closeTime())];
1465 int const threshConsensus =
1468 JLOG(j_.
info()) <<
"Proposers:" << currPeerPositions_.size()
1469 <<
" nw:" << neededWeight <<
" thrV:" << threshVote
1470 <<
" thrC:" << threshConsensus;
1472 for (
auto const& [t, v] : closeTimeVotes)
1476 <<
static_cast<std::uint32_t>(previousLedger_.seq()) + 1 <<
": "
1477 << t.time_since_epoch().count() <<
" has " << v <<
", "
1478 << threshVote <<
" required";
1480 if (v >= threshVote)
1483 consensusCloseTime = t;
1486 if (threshVote >= threshConsensus)
1487 haveCloseTimeConsensus_ =
true;
1491 if (!haveCloseTimeConsensus_)
1494 <<
"No CT consensus:"
1495 <<
" Proposers:" << currPeerPositions_.size()
1496 <<
" Mode:" << to_string(mode_.get())
1497 <<
" Thresh:" << threshConsensus
1503 ((consensusCloseTime != asCloseTime(result_->position.closeTime())) ||
1504 result_->position.isStale(ourCutoff)))
1507 ourNewSet.
emplace(result_->txns);
1512 auto newID = ourNewSet->id();
1514 result_->txns = std::move(*ourNewSet);
1516 JLOG(j_.
info()) <<
"Position change: CTime "
1518 <<
", tx " << newID;
1520 result_->position.changePosition(newID, consensusCloseTime, now_);
1524 if (acquired_.emplace(newID, result_->txns).second)
1526 if (!result_->position.isBowOut())
1527 adaptor_.share(result_->txns);
1529 for (
auto const& [nodeId, peerPos] : currPeerPositions_)
1533 updateDisputes(nodeId, result_->txns);
1538 if (!result_->position.isBowOut() &&
1539 (mode_.get() == ConsensusMode::proposing))
1540 adaptor_.propose(result_->position);
1544 template <
class Adaptor>
1552 int agree = 0, disagree = 0;
1554 auto ourPosition = result_->position.position();
1557 for (
auto const& [nodeId, peerPos] : currPeerPositions_)
1559 Proposal_t const& peerProp = peerPos.proposal();
1560 if (peerProp.
position() == ourPosition)
1566 JLOG(j_.
debug()) << nodeId <<
" has " << peerProp.
position();
1570 auto currentFinished =
1571 adaptor_.proposersFinished(previousLedger_, prevLedgerID_);
1573 JLOG(j_.
debug()) <<
"Checking for TX consensus: agree=" << agree
1574 <<
", disagree=" << disagree;
1583 result_->roundTime.read(),
1585 mode_.get() == ConsensusMode::proposing,
1588 if (result_->state == ConsensusState::No)
1593 if (result_->state == ConsensusState::MovedOn)
1595 JLOG(j_.
error()) <<
"Unable to reach consensus";
1602 template <
class Adaptor>
1606 if (mode_.get() == ConsensusMode::proposing)
1608 if (result_ && !result_->position.isBowOut())
1610 result_->position.bowOut(now_);
1611 adaptor_.propose(result_->position);
1614 mode_.set(ConsensusMode::observing, adaptor_);
1615 JLOG(j_.
info()) <<
"Bowing out of consensus";
1619 template <
class Adaptor>
1627 if (!result_->compares.emplace(o.id()).second)
1631 if (result_->txns.id() == o.id())
1634 JLOG(j_.
debug()) <<
"createDisputes " << result_->txns.id() <<
" to "
1637 auto differences = result_->txns.compare(o);
1641 for (
auto const& [txId, inThisSet] : differences)
1646 (inThisSet && result_->txns.find(txId) && !o.find(txId)) ||
1647 (!inThisSet && !result_->txns.find(txId) && o.find(txId)));
1649 Tx_t tx = inThisSet ? result_->txns.find(txId) : o.find(txId);
1650 auto txID = tx.id();
1652 if (result_->disputes.find(txID) != result_->disputes.end())
1655 JLOG(j_.
debug()) <<
"Transaction " << txID <<
" is disputed";
1659 result_->txns.exists(txID),
1660 std::max(prevProposers_, currPeerPositions_.size()),
1664 for (
auto const& [nodeId, peerPos] : currPeerPositions_)
1666 Proposal_t const& peerProp = peerPos.proposal();
1667 auto const cit = acquired_.find(peerProp.
position());
1668 if (cit != acquired_.end())
1669 dtx.setVote(nodeId, cit->second.exists(txID));
1671 adaptor_.share(dtx.tx());
1673 result_->disputes.emplace(txID, std::move(dtx));
1675 JLOG(j_.
debug()) << dc <<
" differences found";
1678 template <
class Adaptor>
1687 if (result_->compares.find(other.id()) == result_->compares.end())
1688 createDisputes(other);
1690 for (
auto& it : result_->disputes)
1692 auto& d = it.second;
1693 d.setVote(node, other.exists(d.tx().id()));
1697 template <
class Adaptor>