libmdbx/test/extra/crunched_delete.c++
2025-01-10 23:50:05 +03:00

393 lines
12 KiB
C++
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

#include "mdbx.h++"
#include <array>
#include <iostream>
#include <random>
#include <vector>
#if MDBX_DEBUG || !defined(NDEBUG) || defined(__APPLE__) || defined(_WIN32)
#define NN 1024
#else
#define NN 4096
#endif
std::string format_va(const char *fmt, va_list ap) {
va_list ones;
va_copy(ones, ap);
#ifdef _MSC_VER
int needed = _vscprintf(fmt, ap);
#else
int needed = vsnprintf(nullptr, 0, fmt, ap);
#endif
assert(needed >= 0);
std::string result;
result.reserve(size_t(needed + 1));
result.resize(size_t(needed), '\0');
assert(int(result.capacity()) > needed);
int actual = vsnprintf(const_cast<char *>(result.data()), result.capacity(), fmt, ones);
assert(actual == needed);
(void)actual;
va_end(ones);
return result;
}
std::string format(const char *fmt, ...) {
va_list ap;
va_start(ap, fmt);
std::string result = format_va(fmt, ap);
va_end(ap);
return result;
}
struct acase {
unsigned klen_min, klen_max;
unsigned vlen_min, vlen_max;
unsigned dupmax_log2;
acase(unsigned klen_min, unsigned klen_max, unsigned vlen_min, unsigned vlen_max, unsigned dupmax_log2)
: klen_min(klen_min), klen_max(klen_max), vlen_min(vlen_min), vlen_max(vlen_max), dupmax_log2(dupmax_log2) {}
};
// std::random_device rd;
std::mt19937_64 rnd;
static unsigned prng_fast(uint32_t &seed) {
seed = seed * 1103515245 + 12345;
return seed >> 17;
}
static mdbx::slice mk(mdbx::default_buffer &buf, unsigned min, unsigned max) {
uint32_t seed = rnd() % (NN + NN);
unsigned len = (min < max) ? min + prng_fast(seed) % (max - min) : min;
buf.clear_and_reserve(len);
for (unsigned i = 0; i < len; ++i)
buf.append_byte(mdbx::byte(prng_fast(seed)));
return buf.slice();
}
static mdbx::slice mk_key(mdbx::default_buffer &buf, const acase &thecase) {
return mk(buf, thecase.klen_min, thecase.klen_max);
}
static mdbx::slice mk_val(mdbx::default_buffer &buf, const acase &thecase) {
return mk(buf, thecase.vlen_min, thecase.vlen_max);
}
static std::string name(unsigned n) { return format("Commitment_%05u", n); }
static mdbx::map_handle create_and_fill(mdbx::txn txn, const acase &thecase, const unsigned n) {
auto map = txn.create_map(name(n),
(thecase.klen_min == thecase.klen_max && (thecase.klen_min == 4 || thecase.klen_max == 8))
? mdbx::key_mode::ordinal
: mdbx::key_mode::usual,
(thecase.vlen_min == thecase.vlen_max) ? mdbx::value_mode::multi_samelength
: mdbx::value_mode::multi);
if (txn.get_map_stat(map).ms_entries < NN) {
mdbx::default_buffer k, v;
for (auto i = 0u; i < NN; i++) {
mk_key(k, thecase);
for (auto ii = thecase.dupmax_log2 ? 1u + (rnd() & ((2u << thecase.dupmax_log2) - 1u)) : 1u; ii > 0; --ii)
txn.upsert(map, k, mk_val(v, thecase));
}
}
return map;
}
static void chunched_delete(mdbx::txn txn, const acase &thecase, const unsigned n) {
// printf(">> %s, case #%i\n", __FUNCTION__, n);
mdbx::default_buffer k, v;
auto map = txn.open_map_accede(name(n));
{
auto cursor = txn.open_cursor(map);
while (true) {
const auto all = cursor.txn().get_map_stat(cursor.map()).ms_entries;
// printf("== seek random of %u\n", all);
const char *last_op;
bool last_r;
if (true == ((last_op = "MDBX_GET_BOTH"),
(last_r = cursor.find_multivalue(mk_key(k, thecase), mk_val(v, thecase), false))) ||
rnd() % 3 == 0 ||
true == ((last_op = "MDBX_SET_RANGE"), (last_r = cursor.lower_bound(mk_key(k, thecase), false)))) {
int i = int(rnd() % 7) - 3;
// if (i)
// printf(" %s -> %s\n", last_op, last_r ? "true" : "false");
// printf("== shift multi %i\n", i);
try {
while (i < 0 && true == ((last_op = "MDBX_PREV_DUP"), (last_r = cursor.to_current_prev_multi(false))))
++i;
while (i > 0 && true == ((last_op = "MDBX_NEXT_DUP"), (last_r = cursor.to_current_next_multi(false))))
--i;
} catch (const mdbx::no_data &) {
printf("cursor_del() -> exception, last %s %s\n", last_op, last_r ? "true" : "false");
continue;
}
}
// printf(" %s -> %s\n", last_op, last_r ? "true" : "false");
if (all < 42) {
// printf("== erase-tail\n");
break;
}
auto i = all % 17 + 1;
try {
last_r = cursor.erase();
do {
// printf("== erase-chunk: %u\n", i);
// printf(" cursor_del() -> %s\n", last_r ? "true" : "false");
} while (cursor.to_next(false) && --i > 0);
} catch (const mdbx::no_data &) {
printf("cursor_del() -> exception, last %s %s\n", last_op, last_r ? "true" : "false");
}
// (void) last_op;
// (void) last_r;
}
if (cursor.to_first(false))
do
cursor.erase();
while (cursor.to_next(false));
}
// printf("<< %s, case #%i\n", __FUNCTION__, n);
}
static char log_buffer[1024];
static void logger_nofmt(MDBX_log_level_t loglevel, const char *function, int line, const char *msg,
unsigned length) noexcept {
(void)length;
(void)loglevel;
fprintf(stdout, "%s:%u %s", function, line, msg);
}
bool outofrange_prev(mdbx::env env) {
mdbx::cursor_managed cursor;
const std::array<mdbx::pair, 4> items = {{{"k1", "v1"}, {"k1", "v2"}, {"k2", "v1"}, {"k2", "v2"}}};
auto txn = env.start_write();
auto multi = txn.create_map("multi", mdbx::key_mode::usual, mdbx::value_mode::multi);
auto simple = txn.create_map("simple");
txn.clear_map(multi);
txn.clear_map(simple);
txn.insert(simple, items[0]);
txn.insert(simple, items[3]);
cursor.bind(txn, simple);
const auto simple_oor = cursor.lower_bound("k3");
if (simple_oor) {
std::cerr << "simple-outofrange " << simple_oor << "\n";
return false;
}
const auto simple_oor_prevdup = cursor.to_current_prev_multi(false);
if (simple_oor_prevdup) {
std::cerr << "simple-outofrange-prevdup " << simple_oor_prevdup << "\n";
return false;
}
const auto simple_oor_prev = cursor.to_previous(false);
if (!simple_oor_prev || simple_oor_prev != items[3]) {
std::cerr << "simple-outofrange-prev " << simple_oor_prev << "\n";
return false;
}
txn.append(multi, items[0]);
txn.append(multi, items[1]);
txn.append(multi, items[2]);
txn.append(multi, items[3]);
cursor.bind(txn, multi);
const auto multi_oor = cursor.lower_bound("k3");
if (multi_oor) {
std::cerr << "multi-outofrange " << multi_oor << "\n";
return false;
}
const auto multi_oor_prevdup = cursor.to_current_prev_multi(false);
if (multi_oor_prevdup) {
std::cerr << "multi-outofrange-prevdup " << multi_oor_prevdup << "\n";
return false;
}
const auto multi_oor_prev = cursor.to_previous(false);
if (!multi_oor_prev || multi_oor_prev != items[3]) {
std::cerr << "multi-outofrange-prev " << multi_oor_prev << "\n";
return false;
}
txn.commit();
return true;
}
bool next_prev_current(mdbx::env env) {
const std::array<mdbx::pair, 4> items = {{{"k1", "v1"}, {"k1", "v2"}, {"k2", "v1"}, {"k2", "v2"}}};
auto txn = env.start_write();
auto map = txn.create_map("multi", mdbx::key_mode::usual, mdbx::value_mode::multi);
txn.clear_map(map);
for (const auto &i : items)
txn.upsert(map, i);
auto cursor = txn.open_cursor(map);
const auto first = cursor.to_first(false);
if (!first || first != items[0]) {
std::cerr << "bad-first " << first << "\n";
return false;
}
const auto next1 = cursor.to_next(false);
if (!next1 || next1 != items[1]) {
std::cerr << "bad-next-1 " << next1 << "\n";
return false;
}
const auto next2 = cursor.to_next(false);
if (!next2 || next2 != items[2]) {
std::cerr << "bad-next-2 " << next2 << "\n";
return false;
}
const auto prev1 = cursor.to_previous(false);
if (!prev1 || prev1 != items[1]) {
std::cerr << "bad-prev-1 " << prev1 << "\n";
return false;
}
const auto prev2 = cursor.to_previous(false);
if (!prev2 || prev2 != items[0]) {
std::cerr << "bad-prev-2 " << prev2 << "\n";
return false;
}
if (!cursor.erase(false)) {
std::cerr << "bad-erase\n";
return false;
}
const auto after_del = cursor.current(false);
if (!after_del || after_del != items[1]) {
std::cerr << "bad-after-del, current " << after_del << "\n";
return false;
}
const auto next_after_del1 = cursor.to_next(false);
if (!next_after_del1 || next_after_del1 != items[2]) {
std::cerr << "bad-next_after_del1 " << next_after_del1;
return false;
}
const auto next_after_del2 = cursor.to_next(false);
if (!next_after_del2 || next_after_del2 != items[3]) {
std::cerr << "bad-next_after_del2 " << next_after_del2;
return false;
}
const auto next_after_del3 = cursor.to_next(false);
if (next_after_del3) {
std::cerr << "bad-next_after_del3 " << next_after_del3;
return false;
}
txn.commit();
return true;
}
bool simple(mdbx::env env) {
const std::array<mdbx::pair, 3> items = {{{"k0", "v0"}, {"k1", "v1"}, {"k2", "v2"}}};
auto txn = env.start_write();
auto map = txn.create_map("simple");
txn.clear_map(map);
for (const auto &i : items)
txn.insert(map, i);
auto cursor = txn.open_cursor(map);
cursor.seek(items[1].key);
const auto seek = cursor.current(false);
if (seek != items[1]) {
std::cerr << "bad-seek, current " << seek << "\n";
return false;
}
if (!cursor.erase()) {
std::cerr << "bad-erase\n";
return false;
}
const auto next = cursor.to_next(false);
if (!next || next != items[2]) {
std::cerr << "bad-next " << next;
return false;
}
const auto after_del = cursor.current(false);
if (!after_del || after_del != items[2]) {
std::cerr << "bad-after-del, current " << after_del << "\n";
return false;
}
txn.commit();
txn = env.start_read();
cursor.bind(txn, map);
#define BAD_CODE 1
#if BAD_CODE
const auto first = cursor.to_next(false);
#else
const auto first = cursor.to_first(false);
#endif
const auto second = cursor.to_next(false);
const auto eof = cursor.to_next(false);
if (!first || first != items[0]) {
std::cerr << "bad-first " << first << "\n";
return false;
}
if (!second || second != items[2]) {
std::cerr << "bad-second " << second << "\n";
return false;
}
if (eof) {
std::cerr << "bad-eof " << eof << "\n";
return false;
}
return true;
}
int main(int argc, const char *argv[]) {
(void)argc;
(void)argv;
mdbx_setup_debug_nofmt(MDBX_LOG_NOTICE, MDBX_DBG_ASSERT, logger_nofmt, log_buffer, sizeof(log_buffer));
mdbx::path db_filename = "test-crunched-del";
mdbx::env::remove(db_filename);
mdbx::env_managed env(db_filename, mdbx::env_managed::create_parameters(), mdbx::env::operate_parameters(42));
if (!simple(env) || !next_prev_current(env) || !outofrange_prev(env))
return EXIT_FAILURE;
std::vector<acase> testset;
// Там ключи разной длины - от 1 до 64 байт.
// Значения разной длины от 100 до 1000 байт.
testset.emplace_back(/* keylen_min */ 1, /* keylen_max */ 64,
/* datalen_min */ 100, /* datalen_max */
mdbx_env_get_valsize4page_max(env, MDBX_db_flags_t(mdbx::value_mode::multi)),
/* dups_log2 */ 6);
// В одной таблице DupSort: path -> version_u64+data
// path - это префикс в дереве. Самые частые длины: 1-5 байт и 32-36 байт.
testset.emplace_back(1, 5, 100, 1000, 8);
testset.emplace_back(32, 36, 100, 1000, 7);
// В другой DupSort: timestamp_u64 -> path
testset.emplace_back(8, 8, 1, 5, 10);
testset.emplace_back(8, 8, 32, 36, 9);
auto txn = env.start_write();
for (unsigned i = 0; i < testset.size(); ++i)
create_and_fill(txn, testset[i], i);
txn.commit();
// mdbx_setup_debug_nofmt(MDBX_LOG_TRACE, MDBX_DBG_AUDIT | MDBX_DBG_ASSERT,
// logger_nofmt, log_buffer, sizeof(log_buffer));
txn = env.start_write();
for (unsigned i = 0; i < testset.size(); ++i)
chunched_delete(txn, testset[i], i);
txn.commit();
std::cout << "OK\n";
return EXIT_SUCCESS;
}