mirror of
https://github.com/isar/libmdbx.git
synced 2025-01-16 01:34:29 +08:00
230 lines
7.7 KiB
C
230 lines
7.7 KiB
C
/// \copyright SPDX-License-Identifier: Apache-2.0
|
|
/// \author Леонид Юрьев aka Leonid Yuriev <leo@yuriev.ru> \date 2015-2024
|
|
|
|
#include "internals.h"
|
|
|
|
#if MDBX_ENABLE_REFUND
|
|
/* Refunds reclaimed pages that sit at the very end of the allocated space.
 *
 * Starting from the largest page number in txn->tw.relist, follows the run of
 * consecutive page numbers that ends at first_unallocated - 1, removes that
 * run from the list and lowers txn->geo.first_unallocated by its length.
 *
 * Precondition (asserted): the list is not empty and its largest entry is
 * exactly txn->geo.first_unallocated - 1, so at least one page is refunded. */
static void refund_reclaimed(MDBX_txn *txn) {
  const pnl_t relist = txn->tw.relist;
  pgno_t edge = txn->geo.first_unallocated;
  tASSERT(txn, MDBX_PNL_GETSIZE(relist) && MDBX_PNL_MOST(relist) == edge - 1);

#if MDBX_PNL_ASCENDING
  /* The largest numbers are at the tail, so shortening the list is enough. */
  size_t pos = MDBX_PNL_GETSIZE(relist);
  tASSERT(txn, relist[pos] == edge - 1);
  do {
    edge -= 1;
    pos -= 1;
  } while (pos > 0 && relist[pos] == edge - 1);
  MDBX_PNL_SETSIZE(relist, pos);
#else
  /* The largest numbers are at the head: find where the consecutive run
   * stops, then shift the surviving entries down to index 1. */
  size_t pos = 1;
  tASSERT(txn, relist[pos] == edge - 1);
  const size_t total = MDBX_PNL_GETSIZE(relist);
  do {
    edge -= 1;
    pos += 1;
  } while (pos <= total && relist[pos] == edge - 1);
  const size_t remain = total - (pos - 1);
  MDBX_PNL_SETSIZE(relist, remain);
  for (size_t dst = 1, src = pos; dst <= remain; ++dst, ++src)
    relist[dst] = relist[src];
#endif

  VERBOSE("refunded %" PRIaPGNO " pages: %" PRIaPGNO " -> %" PRIaPGNO,
          txn->geo.first_unallocated - edge, txn->geo.first_unallocated, edge);
  txn->geo.first_unallocated = edge;
  tASSERT(txn,
          pnl_check_allocated(txn->tw.relist, txn->geo.first_unallocated - 1));
}
|
|
|
|
/* Removes from the loose-pages chain every page whose number is not below
 * txn->geo.first_unallocated (i.e. pages that have just been refunded).
 * Without MDBX_WRITEMAP each removed page is also handed to
 * page_shadow_release(). */
static void refund_loose_unlink(MDBX_txn *txn) {
  page_t *__restrict *__restrict link = &txn->tw.loose_pages;
  while (*link) {
    page_t *const dp = *link;
    tASSERT(txn, dp->flags == P_LOOSE);
    MDBX_ASAN_UNPOISON_MEMORY_REGION(&page_next(dp), sizeof(page_t *));
    VALGRIND_MAKE_MEM_DEFINED(&page_next(dp), sizeof(page_t *));
    if (txn->geo.first_unallocated > dp->pgno) {
      /* Still inside the allocated space: keep it and advance. */
      link = &page_next(dp);
      continue;
    }
    *link = page_next(dp);
    if ((txn->flags & MDBX_WRITEMAP) == 0)
      page_shadow_release(txn->env, dp, 1);
  }
}

/* Refunds loose pages located at the very end of the allocated space.
 *
 * Lowers txn->geo.first_unallocated past every loose page that forms an
 * unbroken run ending at first_unallocated - 1, drops those pages from the
 * dirty list (when the transaction has one) and from the loose chain, and
 * adjusts loose_count / dirtyroom / pages_including_loose accordingly.
 * On normal completion txn->tw.loose_refund_wl is set to the resulting
 * first_unallocated.
 *
 * Two strategies are used:
 *  - if there is no dirty list, or its unsorted part is larger than the
 *    number of loose pages, candidate page numbers are gathered from the
 *    loose chain into a temporary list which is then sorted;
 *  - otherwise the dirty list itself is sorted and trimmed from its tail.
 *
 * Failure to allocate the temporary list is not an error: the function
 * returns immediately without refunding anything. */
static void refund_loose(MDBX_txn *txn) {
  tASSERT(txn, txn->tw.loose_pages != nullptr);
  tASSERT(txn, txn->tw.loose_count > 0);

  dpl_t *const dl = txn->tw.dirtylist;
  if (dl) {
    tASSERT(txn, dl->length >= txn->tw.loose_count);
    tASSERT(txn, (txn->flags & MDBX_WRITEMAP) == 0 || MDBX_AVOID_MSYNC);
  } else {
    tASSERT(txn, (txn->flags & MDBX_WRITEMAP) != 0 && !MDBX_AVOID_MSYNC);
  }

  /* Scratch list: lives on the stack unless loose_count exceeds its capacity. */
  pgno_t onstack[MDBX_CACHELINE_SIZE * 8 / sizeof(pgno_t)];
  pnl_t suitable = onstack;

  if (!dl || dl->length - dl->sorted > txn->tw.loose_count) {
    /* The dirty list is absent or too unsorted to be worth sorting. */
    if (pnl_bytes2size(sizeof(onstack)) < txn->tw.loose_count) {
      suitable = pnl_alloc(txn->tw.loose_count);
      if (unlikely(!suitable)) {
        /* Out of memory here must not fail the transaction. */
        return;
      }
    }

    /* Gather the loose pages which could possibly be refunded: only those
     * within the last loose_count page numbers before first_unallocated. */
    tASSERT(txn,
            txn->geo.first_unallocated >= MIN_PAGENO + txn->tw.loose_count);
    pgno_t most = MIN_PAGENO;
    size_t gathered = 0;
    for (const page_t *lp = txn->tw.loose_pages; lp; lp = page_next(lp)) {
      tASSERT(txn, lp->flags == P_LOOSE);
      tASSERT(txn, txn->geo.first_unallocated > lp->pgno);
      if (likely(txn->geo.first_unallocated - txn->tw.loose_count <=
                 lp->pgno)) {
        tASSERT(txn, gathered < ((suitable == onstack)
                                     ? pnl_bytes2size(sizeof(onstack))
                                     : MDBX_PNL_ALLOCLEN(suitable)));
        gathered += 1;
        suitable[gathered] = lp->pgno;
        if (lp->pgno > most)
          most = lp->pgno;
      }
      MDBX_ASAN_UNPOISON_MEMORY_REGION(&page_next(lp), sizeof(page_t *));
      VALGRIND_MAKE_MEM_DEFINED(&page_next(lp), sizeof(page_t *));
    }

    if (most + 1 == txn->geo.first_unallocated) {
      /* The topmost loose page is the last allocated one: sort the
       * candidates and find how long the consecutive run at the top is. */
      MDBX_PNL_SETSIZE(suitable, gathered);
      pnl_sort(suitable, MAX_PAGENO + 1);

      /* Iterate from the largest page number towards the smallest. */
      const intptr_t step = MDBX_PNL_ASCENDING ? -1 : 1;
      const intptr_t begin =
          MDBX_PNL_ASCENDING ? MDBX_PNL_GETSIZE(suitable) : 1;
      const intptr_t end =
          MDBX_PNL_ASCENDING ? 0 : MDBX_PNL_GETSIZE(suitable) + 1;
      tASSERT(txn, suitable[begin] >= suitable[end - step]);
      tASSERT(txn, most == suitable[begin]);

      intptr_t cursor = begin + step;
      while (cursor != end && suitable[cursor] == most - 1) {
        most -= 1;
        cursor += step;
      }

      const size_t refunded = txn->geo.first_unallocated - most;
      DEBUG("refund-suitable %zu pages %" PRIaPGNO " -> %" PRIaPGNO, refunded,
            most, txn->geo.first_unallocated);
      txn->geo.first_unallocated = most;
      txn->tw.loose_count -= refunded;

      if (dl) {
        txn->tw.dirtyroom += refunded;
        dl->pages_including_loose -= refunded;
        assert(txn->tw.dirtyroom <= txn->env->options.dp_limit);

        /* Compact the dirty list in place, keeping only entries whose page
         * number is below the new first_unallocated. The sorted prefix is
         * processed first so that dl->sorted can be updated to its new
         * length. */
        size_t rd = 0;
        size_t kept = 0;
        if (dl->sorted) {
          do {
            rd += 1;
            if (dl->items[rd].pgno < most) {
              kept += 1;
              if (kept != rd)
                dl->items[kept] = dl->items[rd];
            }
          } while (rd < dl->sorted);
          dl->sorted = kept;
        }
        while (rd < dl->length) {
          rd += 1;
          if (dl->items[rd].pgno < most) {
            kept += 1;
            if (kept != rd)
              dl->items[kept] = dl->items[rd];
          }
        }
        dpl_setlen(dl, kept);
        tASSERT(txn, txn->tw.dirtyroom + txn->tw.dirtylist->length ==
                         (txn->parent ? txn->parent->tw.dirtyroom
                                      : txn->env->options.dp_limit));
      }

      /* Drop the refunded pages from the loose chain. */
      refund_loose_unlink(txn);
    }
  } else {
    /* The dirty list is mostly sorted: finish sorting it and cut the
     * refundable loose pages off its tail. */
    dpl_sort(txn);
    tASSERT(txn,
            dl->length < 2 || dl->items[1].pgno < dl->items[dl->length].pgno);
    tASSERT(txn, dl->sorted == dl->length);

    /* Walk from the last item backwards while each item is a loose page
     * numbered exactly first_unallocated - 1. */
    size_t tail = dl->length;
    while (dl->items[tail].pgno == txn->geo.first_unallocated - 1 &&
           dl->items[tail].ptr->flags == P_LOOSE) {
      tASSERT(txn, tail > 0);
      page_t *dp = dl->items[tail].ptr;
      DEBUG("refund-sorted page %" PRIaPGNO, dp->pgno);
      tASSERT(txn, dp->pgno == dl->items[tail].pgno);
      txn->geo.first_unallocated -= 1;
      tail -= 1;
    }
    dpl_setlen(dl, tail);

    if (dl->sorted != dl->length) {
      /* dl->sorted still holds the length from before the trim, so the
       * difference is the number of pages cut off above. */
      const size_t refunded = dl->sorted - dl->length;
      dl->sorted = dl->length;
      txn->tw.loose_count -= refunded;
      txn->tw.dirtyroom += refunded;
      dl->pages_including_loose -= refunded;
      tASSERT(txn, txn->tw.dirtyroom + txn->tw.dirtylist->length ==
                       (txn->parent ? txn->parent->tw.dirtyroom
                                    : txn->env->options.dp_limit));

      /* Drop the refunded pages from the loose chain. */
      refund_loose_unlink(txn);
    }
  }

  tASSERT(txn, dpl_check(txn));
  if (suitable != onstack)
    pnl_free(suitable);
  txn->tw.loose_refund_wl = txn->geo.first_unallocated;
}
|
|
|
|
/* Tries to shrink the allocated space of a write transaction by refunding
 * pages located at its very end.
 *
 * Alternates between refunding loose pages (refund_loose) and reclaimed pages
 * (refund_reclaimed) until neither can lower txn->geo.first_unallocated any
 * further. If anything was refunded and the transaction has a spilled list,
 * spill_purge() is called.
 *
 * Returns true if txn->geo.first_unallocated was lowered, false otherwise. */
bool txn_refund(MDBX_txn *txn) {
  const pgno_t initial = txn->geo.first_unallocated;

  /* Loose pages are tried only while the loose_refund_wl mark is above
   * first_unallocated. */
  if (txn->tw.loose_pages &&
      txn->tw.loose_refund_wl > txn->geo.first_unallocated)
    refund_loose(txn);

  /* Continue for as long as the largest reclaimed page is the last
   * allocated one. */
  while (MDBX_PNL_GETSIZE(txn->tw.relist) != 0 &&
         MDBX_PNL_MOST(txn->tw.relist) == txn->geo.first_unallocated - 1) {
    refund_reclaimed(txn);

    const bool loose_pending =
        txn->tw.loose_pages &&
        txn->tw.loose_refund_wl > txn->geo.first_unallocated;
    if (!loose_pending)
      break;

    const pgno_t snapshot = txn->geo.first_unallocated;
    refund_loose(txn);
    if (txn->geo.first_unallocated == snapshot)
      break; /* no progress on loose pages, stop iterating */
  }

  const bool shrunk = initial != txn->geo.first_unallocated;
  if (shrunk && txn->tw.spilled.list) {
    /* Squash deleted page numbers since something was refunded. */
    spill_purge(txn);
  }
  return shrunk;
}
|
|
|
|
#else /* MDBX_ENABLE_REFUND */
|
|
|
|
/* Variant used when MDBX_ENABLE_REFUND is off: there is no online
 * auto-compactification, so nothing is ever refunded.
 *
 * The argument is ignored; always returns false. */
bool txn_refund(MDBX_txn *txn) {
  (void)txn; /* intentionally unused */
  return false;
}
|
|
|
|
#endif /* MDBX_ENABLE_REFUND */
|