rippled
Loading...
Searching...
No Matches
NuDBFactory.cpp
1#include <xrpl/basics/contract.h>
2#include <xrpl/beast/core/LexicalCast.h>
3#include <xrpl/beast/utility/instrumentation.h>
4#include <xrpl/nodestore/Factory.h>
5#include <xrpl/nodestore/Manager.h>
6#include <xrpl/nodestore/detail/DecodedBlob.h>
7#include <xrpl/nodestore/detail/EncodedBlob.h>
8#include <xrpl/nodestore/detail/codec.h>
9
10#include <boost/filesystem.hpp>
11
12#include <nudb/nudb.hpp>
13
14#include <chrono>
15#include <cstdint>
16#include <cstdio>
17#include <exception>
18#include <memory>
19
20namespace xrpl {
21namespace NodeStore {
22
23class NuDBBackend : public Backend
24{
25public:
26 // "appnum" is an application-defined constant stored in the header of a
27 // NuDB database. We used it to identify shard databases before that code
28 // was removed. For now, its only use is a sanity check that the database
29 // was created by xrpld.
30 static constexpr std::uint64_t appnum = 1;
31
33 size_t const keyBytes_;
37 nudb::store db_;
40
42 size_t keyBytes,
43 Section const& keyValues,
45 Scheduler& scheduler,
46 beast::Journal journal)
47 : j_(journal)
48 , keyBytes_(keyBytes)
50 , name_(get(keyValues, "path"))
51 , blockSize_(parseBlockSize(name_, keyValues, journal))
52 , deletePath_(false)
53 , scheduler_(scheduler)
54 {
55 if (name_.empty())
56 Throw<std::runtime_error>("nodestore: Missing path in NuDB backend");
57 }
58
60 size_t keyBytes,
61 Section const& keyValues,
63 Scheduler& scheduler,
64 nudb::context& context,
65 beast::Journal journal)
66 : j_(journal)
67 , keyBytes_(keyBytes)
69 , name_(get(keyValues, "path"))
70 , blockSize_(parseBlockSize(name_, keyValues, journal))
71 , db_(context)
72 , deletePath_(false)
73 , scheduler_(scheduler)
74 {
75 if (name_.empty())
76 Throw<std::runtime_error>("nodestore: Missing path in NuDB backend");
77 }
78
79 ~NuDBBackend() override
80 {
81 try
82 {
83 // close can throw and we don't want the destructor to throw.
84 close();
85 }
86 catch (nudb::system_error const&)
87 {
88 // Don't allow exceptions to propagate out of destructors.
89 // close() has already logged the error.
90 }
91 }
92
94 getName() override
95 {
96 return name_;
97 }
98
100 getBlockSize() const override
101 {
102 return blockSize_;
103 }
104
105 void
106 open(bool createIfMissing, uint64_t appType, uint64_t uid, uint64_t salt) override
107 {
108 using namespace boost::filesystem;
109 if (db_.is_open())
110 {
111 // LCOV_EXCL_START
112 UNREACHABLE(
113 "xrpl::NodeStore::NuDBBackend::open : database is already "
114 "open");
115 JLOG(j_.error()) << "database is already open";
116 return;
117 // LCOV_EXCL_STOP
118 }
119 auto const folder = path(name_);
120 auto const dp = (folder / "nudb.dat").string();
121 auto const kp = (folder / "nudb.key").string();
122 auto const lp = (folder / "nudb.log").string();
123 nudb::error_code ec;
124 if (createIfMissing)
125 {
126 create_directories(folder);
127 nudb::create<nudb::xxhasher>(
128 dp, kp, lp, appType, uid, salt, keyBytes_, blockSize_, 0.50, ec);
129 if (ec == nudb::errc::file_exists)
130 ec = {};
131 if (ec)
132 Throw<nudb::system_error>(ec);
133 }
134 db_.open(dp, kp, lp, ec);
135 if (ec)
136 Throw<nudb::system_error>(ec);
137
138 if (db_.appnum() != appnum)
139 Throw<std::runtime_error>("nodestore: unknown appnum");
140 db_.set_burst(burstSize_);
141 }
142
143 bool
144 isOpen() override
145 {
146 return db_.is_open();
147 }
148
149 void
150 open(bool createIfMissing) override
151 {
152 open(createIfMissing, appnum, nudb::make_uid(), nudb::make_salt());
153 }
154
155 void
156 close() override
157 {
158 if (db_.is_open())
159 {
160 nudb::error_code ec;
161 db_.close(ec);
162 if (ec)
163 {
164 // Log to make sure the nature of the error gets to the user.
165 JLOG(j_.fatal()) << "NuBD close() failed: " << ec.message();
166 Throw<nudb::system_error>(ec);
167 }
168
169 if (deletePath_)
170 {
171 boost::filesystem::remove_all(name_, ec);
172 if (ec)
173 {
174 JLOG(j_.fatal())
175 << "Filesystem remove_all of " << name_ << " failed with: " << ec.message();
176 }
177 }
178 }
179 }
180
181 Status
182 fetch(void const* key, std::shared_ptr<NodeObject>* pno) override
183 {
184 Status status;
185 pno->reset();
186 nudb::error_code ec;
187 db_.fetch(
188 key,
189 [key, pno, &status](void const* data, std::size_t size) {
190 nudb::detail::buffer bf;
191 auto const result = nodeobject_decompress(data, size, bf);
192 DecodedBlob decoded(key, result.first, result.second);
193 if (!decoded.wasOk())
194 {
195 status = dataCorrupt;
196 return;
197 }
198 *pno = decoded.createObject();
199 status = ok;
200 },
201 ec);
202 if (ec == nudb::error::key_not_found)
203 return notFound;
204 if (ec)
205 Throw<nudb::system_error>(ec);
206 return status;
207 }
208
211 {
213 results.reserve(hashes.size());
214 for (auto const& h : hashes)
215 {
217 Status status = fetch(h->begin(), &nObj);
218 if (status != ok)
219 results.push_back({});
220 else
221 results.push_back(nObj);
222 }
223
224 return {results, ok};
225 }
226
227 void
229 {
230 EncodedBlob e(no);
231 nudb::error_code ec;
232 nudb::detail::buffer bf;
233 auto const result = nodeobject_compress(e.getData(), e.getSize(), bf);
234 db_.insert(e.getKey(), result.first, result.second, ec);
235 if (ec && ec != nudb::error::key_exists)
236 Throw<nudb::system_error>(ec);
237 }
238
239 void
241 {
242 BatchWriteReport report;
243 report.writeCount = 1;
244 auto const start = std::chrono::steady_clock::now();
245 do_insert(no);
246 report.elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(
248 scheduler_.onBatchWrite(report);
249 }
250
251 void
252 storeBatch(Batch const& batch) override
253 {
254 BatchWriteReport report;
255 report.writeCount = batch.size();
256 auto const start = std::chrono::steady_clock::now();
257 for (auto const& e : batch)
258 do_insert(e);
259 report.elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(
261 scheduler_.onBatchWrite(report);
262 }
263
264 void
265 sync() override
266 {
267 }
268
269 void
271 {
272 auto const dp = db_.dat_path();
273 auto const kp = db_.key_path();
274 auto const lp = db_.log_path();
275 // auto const appnum = db_.appnum();
276 nudb::error_code ec;
277 db_.close(ec);
278 if (ec)
279 Throw<nudb::system_error>(ec);
280 nudb::visit(
281 dp,
282 [&](void const* key,
283 std::size_t key_bytes,
284 void const* data,
285 std::size_t size,
286 nudb::error_code&) {
287 nudb::detail::buffer bf;
288 auto const result = nodeobject_decompress(data, size, bf);
289 DecodedBlob decoded(key, result.first, result.second);
290 if (!decoded.wasOk())
291 {
292 ec = make_error_code(nudb::error::missing_value);
293 return;
294 }
295 f(decoded.createObject());
296 },
297 nudb::no_progress{},
298 ec);
299 if (ec)
300 Throw<nudb::system_error>(ec);
301 db_.open(dp, kp, lp, ec);
302 if (ec)
303 Throw<nudb::system_error>(ec);
304 }
305
306 int
307 getWriteLoad() override
308 {
309 return 0;
310 }
311
312 void
313 setDeletePath() override
314 {
315 deletePath_ = true;
316 }
317
318 void
319 verify() override
320 {
321 auto const dp = db_.dat_path();
322 auto const kp = db_.key_path();
323 auto const lp = db_.log_path();
324 nudb::error_code ec;
325 db_.close(ec);
326 if (ec)
327 Throw<nudb::system_error>(ec);
328 nudb::verify_info vi;
329 nudb::verify<nudb::xxhasher>(vi, dp, kp, 0, nudb::no_progress{}, ec);
330 if (ec)
331 Throw<nudb::system_error>(ec);
332 db_.open(dp, kp, lp, ec);
333 if (ec)
334 Throw<nudb::system_error>(ec);
335 }
336
337 int
338 fdRequired() const override
339 {
340 return 3;
341 }
342
343private:
344 static std::size_t
345 parseBlockSize(std::string const& name, Section const& keyValues, beast::Journal journal)
346 {
347 using namespace boost::filesystem;
348 auto const folder = path(name);
349 auto const kp = (folder / "nudb.key").string();
350
351 std::size_t const defaultSize = nudb::block_size(kp); // Default 4K from NuDB
352 std::size_t blockSize = defaultSize;
353 std::string blockSizeStr;
354
355 if (!get_if_exists(keyValues, "nudb_block_size", blockSizeStr))
356 {
357 return blockSize; // Early return with default
358 }
359
360 try
361 {
362 std::size_t const parsedBlockSize = beast::lexicalCastThrow<std::size_t>(blockSizeStr);
363
364 // Validate: must be power of 2 between 4K and 32K
365 if (parsedBlockSize < 4096 || parsedBlockSize > 32768 ||
366 (parsedBlockSize & (parsedBlockSize - 1)) != 0)
367 {
369 s << "Invalid nudb_block_size: " << parsedBlockSize
370 << ". Must be power of 2 between 4096 and 32768.";
371 Throw<std::runtime_error>(s.str());
372 }
373
374 JLOG(journal.info()) << "Using custom NuDB block size: " << parsedBlockSize << " bytes";
375 return parsedBlockSize;
376 }
377 catch (std::exception const& e)
378 {
380 s << "Invalid nudb_block_size value: " << blockSizeStr << ". Error: " << e.what();
381 Throw<std::runtime_error>(s.str());
382 }
383 }
384};
385
386//------------------------------------------------------------------------------
387
388class NuDBFactory : public Factory
389{
390private:
392
393public:
394 explicit NuDBFactory(Manager& manager) : manager_(manager)
395 {
396 manager_.insert(*this);
397 }
398
400 getName() const override
401 {
402 return "NuDB";
403 }
404
407 size_t keyBytes,
408 Section const& keyValues,
410 Scheduler& scheduler,
411 beast::Journal journal) override
412 {
413 return std::make_unique<NuDBBackend>(keyBytes, keyValues, burstSize, scheduler, journal);
414 }
415
418 size_t keyBytes,
419 Section const& keyValues,
421 Scheduler& scheduler,
422 nudb::context& context,
423 beast::Journal journal) override
424 {
426 keyBytes, keyValues, burstSize, scheduler, context, journal);
427 }
428};
429
430void
432{
433 static NuDBFactory instance{manager};
434}
435
436} // namespace NodeStore
437} // namespace xrpl
A generic endpoint for log messages.
Definition Journal.h:40
Stream fatal() const
Definition Journal.h:325
Stream error() const
Definition Journal.h:319
Stream info() const
Definition Journal.h:307
A backend used for the NodeStore.
Definition Backend.h:20
Parsed key/value blob into NodeObject components.
Definition DecodedBlob.h:19
std::shared_ptr< NodeObject > createObject()
Create a NodeObject from this data.
bool wasOk() const noexcept
Determine if the decoding was successful.
Definition DecodedBlob.h:26
Convert a NodeObject from in-memory to database format.
Definition EncodedBlob.h:36
void const * getKey() const noexcept
Definition EncodedBlob.h:89
std::size_t getSize() const noexcept
Definition EncodedBlob.h:95
void const * getData() const noexcept
Base class for backend factories.
Definition Factory.h:16
Singleton for managing NodeStore factories and back ends.
Definition Manager.h:12
virtual void insert(Factory &factory)=0
Add a factory.
NuDBBackend(size_t keyBytes, Section const &keyValues, std::size_t burstSize, Scheduler &scheduler, beast::Journal journal)
std::size_t const blockSize_
void verify() override
Perform consistency checks on database.
void storeBatch(Batch const &batch) override
Store a group of objects.
int getWriteLoad() override
Estimate the number of write operations pending.
std::pair< std::vector< std::shared_ptr< NodeObject > >, Status > fetchBatch(std::vector< uint256 const * > const &hashes) override
Fetch a batch synchronously.
std::optional< std::size_t > getBlockSize() const override
Get the block size for backends that support it.
static std::size_t parseBlockSize(std::string const &name, Section const &keyValues, beast::Journal journal)
int fdRequired() const override
Returns the number of file descriptors the backend expects to need.
void store(std::shared_ptr< NodeObject > const &no) override
Store a single object.
beast::Journal const j_
static constexpr std::uint64_t appnum
NuDBBackend(size_t keyBytes, Section const &keyValues, std::size_t burstSize, Scheduler &scheduler, nudb::context &context, beast::Journal journal)
std::string getName() override
Get the human-readable name of this backend.
Status fetch(void const *key, std::shared_ptr< NodeObject > *pno) override
Fetch a single object.
void do_insert(std::shared_ptr< NodeObject > const &no)
void open(bool createIfMissing) override
Open the backend.
void open(bool createIfMissing, uint64_t appType, uint64_t uid, uint64_t salt) override
Open the backend.
std::size_t const burstSize_
void close() override
Close the backend.
void setDeletePath() override
Remove contents on disk upon destruction.
bool isOpen() override
Returns true is the database is open.
void for_each(std::function< void(std::shared_ptr< NodeObject >)> f) override
Visit every object in the database This is usually called during import.
std::atomic< bool > deletePath_
std::unique_ptr< Backend > createInstance(size_t keyBytes, Section const &keyValues, std::size_t burstSize, Scheduler &scheduler, nudb::context &context, beast::Journal journal) override
Create an instance of this factory's backend.
NuDBFactory(Manager &manager)
std::unique_ptr< Backend > createInstance(size_t keyBytes, Section const &keyValues, std::size_t burstSize, Scheduler &scheduler, beast::Journal journal) override
Create an instance of this factory's backend.
std::string getName() const override
Retrieve the name of this factory.
Scheduling for asynchronous backend activity.
virtual void onBatchWrite(BatchWriteReport const &report)=0
Reports the completion of a batch write Allows the scheduler to monitor the node store's performance.
Holds a collection of configuration values.
Definition BasicConfig.h:24
T empty(T... args)
T is_same_v
void registerNuDBFactory(Manager &manager)
std::pair< void const *, std::size_t > nodeobject_compress(void const *in, std::size_t in_size, BufferFactory &&bf)
Definition codec.h:190
Status
Return codes from Backend operations.
std::pair< void const *, std::size_t > nodeobject_decompress(void const *in, std::size_t in_size, BufferFactory &&bf)
Definition codec.h:86
Use hash_* containers for keys that do not need a cryptographically secure hashing algorithm.
Definition algorithm.h:5
std::error_code make_error_code(xrpl::TokenCodecErrc e)
T get(Section const &section, std::string const &name, T const &defaultValue=T{})
Retrieve a key/value pair from a section.
@ open
We haven't closed our ledger yet, but others might have.
bool get_if_exists(Section const &section, std::string const &name, T &v)
@ no
Definition Steps.h:24
T push_back(T... args)
T reserve(T... args)
T reset(T... args)
T size(T... args)
T str(T... args)
Contains information about a batch write operation.
T what(T... args)