Skip to content

Commit

Permalink
Improve logging related to ledger acquisition
Browse files Browse the repository at this point in the history
  • Loading branch information
ximinez committed Sep 11, 2024
1 parent 1655475 commit 9e5487c
Show file tree
Hide file tree
Showing 6 changed files with 130 additions and 11 deletions.
18 changes: 18 additions & 0 deletions src/xrpld/app/ledger/InboundLedger.h
Original file line number Diff line number Diff line change
Expand Up @@ -196,6 +196,24 @@ class InboundLedger final : public TimeoutCounter,
std::unique_ptr<PeerSet> mPeerSet;
};

inline std::string
to_string(InboundLedger::Reason reason)
{
using enum InboundLedger::Reason;
switch (reason)
{
case HISTORY:

Check warning on line 205 in src/xrpld/app/ledger/InboundLedger.h

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/InboundLedger.h#L205

Added line #L205 was not covered by tests
return "HISTORY";
case GENERIC:
return "GENERIC";
case CONSENSUS:
return "CONSENSUS";
default:
assert(false);

Check warning on line 212 in src/xrpld/app/ledger/InboundLedger.h

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/InboundLedger.h#L211-L212

Added lines #L211 - L212 were not covered by tests
return "unknown";
}
}

} // namespace ripple

#endif
9 changes: 8 additions & 1 deletion src/xrpld/app/ledger/detail/InboundLedger.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -390,7 +390,14 @@ InboundLedger::onTimer(bool wasProgress, ScopedLockType&)

if (!wasProgress)
{
checkLocal();
if (checkLocal())
{
// Done. Something else (probably consensus) built the ledger
// locally while waiting for data (or possibly before requesting)
assert(isDone());
JLOG(journal_.info()) << "Finished while waiting " << hash_;
return;

Check warning on line 399 in src/xrpld/app/ledger/detail/InboundLedger.cpp

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/detail/InboundLedger.cpp#L399

Added line #L399 was not covered by tests
}

mByHash = true;

Expand Down
100 changes: 93 additions & 7 deletions src/xrpld/app/ledger/detail/InboundLedgers.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -74,18 +74,98 @@ class InboundLedgersImp : public InboundLedgers
auto doAcquire = [&, seq, reason]() -> std::shared_ptr<Ledger const> {
assert(hash.isNonZero());

// probably not the right rule
if (app_.getOPs().isNeedNetworkLedger() &&
(reason != InboundLedger::Reason::GENERIC) &&
(reason != InboundLedger::Reason::CONSENSUS))
bool const shouldAcquire = [&]() {
if (!app_.getOPs().isNeedNetworkLedger())
return true;
if (reason == InboundLedger::Reason::GENERIC)
return true;

Check warning on line 81 in src/xrpld/app/ledger/detail/InboundLedgers.cpp

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/detail/InboundLedgers.cpp#L81

Added line #L81 was not covered by tests
if (reason == InboundLedger::Reason::CONSENSUS)
return true;
return false;

Check warning on line 84 in src/xrpld/app/ledger/detail/InboundLedgers.cpp

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/detail/InboundLedgers.cpp#L83-L84

Added lines #L83 - L84 were not covered by tests
}();
assert(
shouldAcquire ==
!(app_.getOPs().isNeedNetworkLedger() &&
(reason != InboundLedger::Reason::GENERIC) &&
(reason != InboundLedger::Reason::CONSENSUS)));

std::stringstream ss;
ss << "InboundLedger::acquire: "
<< "Request: " << to_string(hash) << ", " << seq
<< " NeedNetworkLedger: "
<< (app_.getOPs().isNeedNetworkLedger() ? "yes" : "no")
<< " Reason: " << to_string(reason)
<< " Should acquire: " << (shouldAcquire ? "true." : "false.");

/* Acquiring ledgers is somewhat expensive. It requires lots of
* computation and network communication. Avoid it when it's not
* appropriate. Every validation from a peer for a ledger that
* we do not have locally results in a call to this function: even
* if we are moments away from validating the same ledger.
*/
bool const shouldBroadcast = [&]() {
// If the node is not in "full" state, it needs to sync to
// the network, and doesn't have the necessary tx's and
// ledger entries to build the ledger.
bool const isFull = app_.getOPs().isFull();
// If everything else is ok, don't try to acquire the ledger
// if the requested seq is in the near future relative to
// the validated ledger. If the requested ledger is between
// 1 and 19 inclusive ledgers ahead of the valid ledger this
// node has not built it yet, but it's possible/likely it
// has the tx's necessary to build it and get caught up.
// Plus it might not become validated. On the other hand, if
// it's more than 20 in the future, this node should request
// it so that it can jump ahead and get caught up.
LedgerIndex const validSeq =
app_.getLedgerMaster().getValidLedgerIndex();
constexpr std::size_t lagLeeway = 20;
bool const nearFuture =
(seq > validSeq) && (seq < validSeq + lagLeeway);
// If everything else is ok, don't try to acquire the ledger
// if the request is related to consensus. (Note that
// consensus calls usually pass a seq of 0, so nearFuture
// will be false other than on a brand new network.)
bool const consensus =
reason == InboundLedger::Reason::CONSENSUS;
ss << " Evaluating whether to broadcast requests to peers"
<< ". full: " << (isFull ? "true" : "false")
<< ". ledger sequence " << seq
<< ". Valid sequence: " << validSeq
<< ". Lag leeway: " << lagLeeway
<< ". request for near future ledger: "
<< (nearFuture ? "true" : "false")
<< ". Consensus: " << (consensus ? "true" : "false");

// If the node is not synced, send requests.
if (!isFull)
return true;

Check warning on line 142 in src/xrpld/app/ledger/detail/InboundLedgers.cpp

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/detail/InboundLedgers.cpp#L142

Added line #L142 was not covered by tests
// If the ledger is in the near future, do NOT send requests.
// This node is probably about to build it.
if (nearFuture)
return false;

Check warning on line 146 in src/xrpld/app/ledger/detail/InboundLedgers.cpp

View check run for this annotation

Codecov / codecov/patch

src/xrpld/app/ledger/detail/InboundLedgers.cpp#L146

Added line #L146 was not covered by tests
// If the request is because of consensus, do NOT send requests.
// This node is probably about to build it.
if (consensus)
return false;
return true;
}();
ss << ". Would broadcast to peers? "
<< (shouldBroadcast ? "true." : "false.");

if (!shouldAcquire)
{
JLOG(j_.debug()) << "Abort(rule): " << ss.str();
return {};
}

bool isNew = true;
std::shared_ptr<InboundLedger> inbound;
{
ScopedLockType sl(mLock);
if (stopping_)
{
JLOG(j_.debug()) << "Abort(stopping): " << ss.str();
return {};
}

Expand All @@ -109,23 +189,29 @@ class InboundLedgersImp : public InboundLedgers
++mCounter;
}
}
ss << " IsNew: " << (isNew ? "true" : "false");

if (inbound->isFailed())
{
JLOG(j_.debug()) << "Abort(failed): " << ss.str();
return {};
}

if (!isNew)
inbound->update(seq);

if (!inbound->isComplete())
{
JLOG(j_.debug()) << "InProgress: " << ss.str();
return {};
}

JLOG(j_.debug()) << "Complete: " << ss.str();
return inbound->getLedger();
};
using namespace std::chrono_literals;
std::shared_ptr<Ledger const> ledger = perf::measureDurationAndLog(
return perf::measureDurationAndLog(
doAcquire, "InboundLedgersImp::acquire", 500ms, j_);

return ledger;
}

void
Expand Down
5 changes: 3 additions & 2 deletions src/xrpld/app/ledger/detail/LedgerMaster.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -1046,8 +1046,9 @@ LedgerMaster::checkAccept(std::shared_ptr<Ledger const> const& ledger)
}

JLOG(m_journal.info()) << "Advancing accepted ledger to "
<< ledger->info().seq << " with >= " << minVal
<< " validations";
<< ledger->info().seq << " ("
<< to_short_string(ledger->info().hash)
<< ") with >= " << minVal << " validations";

ledger->setValidated();
ledger->setFull();
Expand Down
8 changes: 8 additions & 0 deletions src/xrpld/app/ledger/detail/TimeoutCounter.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,8 @@ TimeoutCounter::setTimer(ScopedLockType& sl)
{
if (isDone())
return;
JLOG(journal_.debug()) << "Setting timer for " << timerInterval_.count()
<< "ms";
timer_.expires_after(timerInterval_);
timer_.async_wait(
[wptr = pmDowncast()](boost::system::error_code const& ec) {
Expand All @@ -60,6 +62,12 @@ TimeoutCounter::setTimer(ScopedLockType& sl)

if (auto ptr = wptr.lock())
{
JLOG(ptr->journal_.debug())
<< "timer: ec: " << ec << " (operation_aborted: "
<< boost::asio::error::operation_aborted << " - "
<< (ec == boost::asio::error::operation_aborted ? "aborted"
: "other")
<< ")";
ScopedLockType sl(ptr->mtx_);
ptr->queueJob(sl);
}
Expand Down
1 change: 0 additions & 1 deletion src/xrpld/overlay/detail/PeerImp.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -32,7 +32,6 @@
#include <xrpld/overlay/detail/PeerImp.h>
#include <xrpld/overlay/detail/ProtocolMessage.h>
#include <xrpld/overlay/detail/Tuning.h>
#include <xrpld/overlay/detail/ProtocolMessage.h>
#include <xrpld/overlay/predicates.h>
#include <xrpld/perflog/PerfLog.h>
#include <xrpl/basics/UptimeClock.h>
Expand Down

0 comments on commit 9e5487c

Please sign in to comment.