From f53dc70038cd61e66782301f4dea247c46f3da43 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=D0=9B=D0=B5=D0=BE=D0=BD=D0=B8=D0=B4=20=D0=AE=D1=80=D1=8C?= =?UTF-8?q?=D0=B5=D0=B2=20=28Leonid=20Yuriev=29?= Date: Fri, 30 Dec 2022 01:51:08 +0300 Subject: [PATCH] =?UTF-8?q?mdbx:=20=D0=B4=D0=BE=D0=B1=D0=B0=D0=B2=D0=BB?= =?UTF-8?q?=D0=B5=D0=BD=D0=B8=D0=B5=20`eq=5Ffast()`=20=D0=B4=D0=BB=D1=8F?= =?UTF-8?q?=20=D1=81=D1=80=D0=B0=D0=B2=D0=BD=D0=B5=D0=BD=D0=B8=D0=B9=20?= =?UTF-8?q?=D0=BD=D0=B0=20(=D0=BD=D0=B5)=D1=80=D0=B0=D0=B2=D0=B5=D0=BD?= =?UTF-8?q?=D1=81=D1=82=D0=B2=D0=BE.?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Цель в том, чтобы уменьшить кол-во условных и безусловных переходов при сравнениях равно/неравно, в том числе избегать вызовов задаваемых кастомных компаратаров и memcmp() для коротких ключей/значений. --- src/core.c | 92 +++++++++++++++++++++++++++++------------------------- 1 file changed, 50 insertions(+), 42 deletions(-) diff --git a/src/core.c b/src/core.c index fef9b487..3116448d 100644 --- a/src/core.c +++ b/src/core.c @@ -15236,12 +15236,31 @@ __hot static int cmp_lenfast(const MDBX_val *a, const MDBX_val *b) { : memcmp(a->iov_base, b->iov_base, a->iov_len); } -static bool unsure_equal(MDBX_cmp_func cmp, const MDBX_val *a, - const MDBX_val *b) { - /* checking for the use of a known good comparator - * or/otherwise for a full byte-to-byte match */ - return cmp == cmp_lenfast || cmp == cmp_lexical || cmp == cmp_reverse || - cmp == cmp_int_unaligned || cmp_lenfast(a, b) == 0; +__hot static bool eq_fast_slowpath(const uint8_t *a, const uint8_t *b, + size_t l) { + if (likely(l > 3)) { + if (MDBX_UNALIGNED_OK >= 4 && likely(l < 9)) + return ((unaligned_peek_u32(1, a) - unaligned_peek_u32(1, b)) | + (unaligned_peek_u32(1, a + l - 4) - + unaligned_peek_u32(1, b + l - 4))) == 0; + if (MDBX_UNALIGNED_OK >= 8 && sizeof(size_t) > 7 && likely(l < 17)) + return ((unaligned_peek_u64(1, a) - unaligned_peek_u64(1, b)) | + (unaligned_peek_u64(1, a + l - 8) - + unaligned_peek_u64(1, b + l - 8))) == 0; + return memcmp(a, b, l) == 0; + } + if (likely(l)) { + STATIC_ASSERT(sizeof(int) > 2); + const unsigned a3 = a[0] << 16 | a[l >> 1] << 8 | a[l - 1]; + const unsigned b3 = b[0] << 16 | b[l >> 1] << 8 | b[l - 1]; + return a3 == b3; + } + return true; +} + +static __always_inline bool eq_fast(const MDBX_val *a, const MDBX_val *b) { + return unlikely(a->iov_len == b->iov_len) && + eq_fast_slowpath(a->iov_base, b->iov_base, a->iov_len); } /* Search for key within a page, using binary search. @@ -17099,25 +17118,21 @@ static __hot int cursor_put_nochecklen(MDBX_cursor *mc, const MDBX_val *key, flags -= MDBX_ALLDUPS; rc = MDBX_NOTFOUND; exact = false; - } else /* checking for early exit without dirtying pages */ - if (!(flags & (MDBX_RESERVE | MDBX_MULTIPLE)) && - unlikely(mc->mc_dbx->md_dcmp(data, &olddata) == 0)) { - if (!mc->mc_xcursor) - /* the same data, nothing to update */ - return MDBX_SUCCESS; - if (flags & MDBX_NODUPDATA) - return MDBX_KEYEXIST; - if (flags & MDBX_APPENDDUP) - return MDBX_EKEYMISMATCH; - if (likely(unsure_equal(mc->mc_dbx->md_dcmp, data, &olddata))) - /* data is match exactly byte-to-byte, nothing to update */ - return MDBX_SUCCESS; - else { - /* The data has differences, but the user-provided comparator - * considers them equal. So continue update since called without. - * Continue to update since was called without MDBX_NODUPDATA. */ + } else if (!(flags & (MDBX_RESERVE | MDBX_MULTIPLE))) { + /* checking for early exit without dirtying pages */ + if (unlikely(eq_fast(data, &olddata))) { + cASSERT(mc, mc->mc_dbx->md_dcmp(data, &olddata) == 0); + if (mc->mc_xcursor) { + if (flags & MDBX_NODUPDATA) + return MDBX_KEYEXIST; + if (flags & MDBX_APPENDDUP) + return MDBX_EKEYMISMATCH; } + /* the same data, nothing to update */ + return MDBX_SUCCESS; } + cASSERT(mc, mc->mc_dbx->md_dcmp(data, &olddata) != 0); + } } } else if (unlikely(rc != MDBX_NOTFOUND)) return rc; @@ -17322,28 +17337,21 @@ static __hot int cursor_put_nochecklen(MDBX_cursor *mc, const MDBX_val *key, /* Was a single item before, must convert now */ if (!(node_flags(node) & F_DUPDATA)) { - /* does data match? */ - const int cmp = mc->mc_dbx->md_dcmp(data, &olddata); - if ((flags & MDBX_APPENDDUP) && unlikely(cmp <= 0)) - return MDBX_EKEYMISMATCH; - if (cmp == 0) { + if (flags & MDBX_APPENDDUP) { + const int cmp = mc->mc_dbx->md_dcmp(data, &olddata); + cASSERT(mc, cmp != 0 || eq_fast(data, &olddata)); + if (unlikely(cmp <= 0)) + return MDBX_EKEYMISMATCH; + } else if (eq_fast(data, &olddata)) { + cASSERT(mc, mc->mc_dbx->md_dcmp(data, &olddata) == 0); if (flags & MDBX_NODUPDATA) return MDBX_KEYEXIST; - if (likely(unsure_equal(mc->mc_dbx->md_dcmp, data, &olddata))) { - /* data is match exactly byte-to-byte, nothing to update */ - if (unlikely(flags & MDBX_MULTIPLE)) { - rc = MDBX_SUCCESS; - goto continue_multiple; - } - return MDBX_SUCCESS; - } else { - /* The data has differences, but the user-provided comparator - * considers them equal. So continue update since called without. - * Continue to update since was called without MDBX_NODUPDATA. */ - } - cASSERT(mc, node_size(key, data) <= env->me_leaf_nodemax); - goto current; + /* data is match exactly byte-to-byte, nothing to update */ + rc = MDBX_SUCCESS; + if (likely((flags & MDBX_MULTIPLE) == 0)) + return rc; + goto continue_multiple; } /* Just overwrite the current item */