/// \copyright SPDX-License-Identifier: Apache-2.0 /// \author Леонид Юрьев aka Leonid Yuriev \date 2015-2024 #include "internals.h" __cold static unsigned default_rp_augment_limit(const MDBX_env *env) { const size_t timeframe = /* 16 секунд */ 16 << 16; const size_t remain_1sec = (env->options.gc_time_limit < timeframe) ? timeframe - (size_t)env->options.gc_time_limit : 0; const size_t minimum = (env->maxgc_large1page * 2 > MDBX_PNL_INITIAL) ? env->maxgc_large1page * 2 : MDBX_PNL_INITIAL; const size_t one_third = env->geo_in_bytes.now / 3 >> env->ps2ln; const size_t augment_limit = (one_third > minimum) ? minimum + (one_third - minimum) / timeframe * remain_1sec : minimum; eASSERT(env, augment_limit < PAGELIST_LIMIT); return pnl_bytes2size(pnl_size2bytes(augment_limit)); } static bool default_prefault_write(const MDBX_env *env) { return !MDBX_MMAP_INCOHERENT_FILE_WRITE && !env->incore && (env->flags & (MDBX_WRITEMAP | MDBX_RDONLY)) == MDBX_WRITEMAP; } static bool default_prefer_waf_insteadof_balance(const MDBX_env *env) { (void)env; return false; } void env_options_init(MDBX_env *env) { env->options.rp_augment_limit = MDBX_PNL_INITIAL; env->options.dp_reserve_limit = MDBX_PNL_INITIAL; env->options.dp_initial = MDBX_PNL_INITIAL; env->options.spill_max_denominator = 8; env->options.spill_min_denominator = 8; env->options.spill_parent4child_denominator = 0; env->options.dp_loose_limit = 64; env->options.merge_threshold_16dot16_percent = 65536 / 4 /* 25% */; if (default_prefer_waf_insteadof_balance(env)) env->options.prefer_waf_insteadof_balance = true; #if !(defined(_WIN32) || defined(_WIN64)) env->options.writethrough_threshold = #if defined(__linux__) || defined(__gnu_linux__) globals.running_on_WSL1 ? MAX_PAGENO : #endif /* Linux */ MDBX_WRITETHROUGH_THRESHOLD_DEFAULT; #endif /* Windows */ } void env_options_adjust_defaults(MDBX_env *env) { if (!env->options.flags.non_auto.rp_augment_limit) env->options.rp_augment_limit = default_rp_augment_limit(env); if (!env->options.flags.non_auto.prefault_write) env->options.prefault_write = default_prefault_write(env); const size_t basis = env->geo_in_bytes.now; /* TODO: use options? */ const unsigned factor = 9; size_t threshold = (basis < ((size_t)65536 << factor)) ? 65536 /* minimal threshold */ : (basis > (MEGABYTE * 4 << factor)) ? MEGABYTE * 4 /* maximal threshold */ : basis >> factor; threshold = (threshold < env->geo_in_bytes.shrink || !env->geo_in_bytes.shrink) ? threshold : env->geo_in_bytes.shrink; env->madv_threshold = bytes2pgno(env, bytes_align2os_bytes(env, threshold)); } //------------------------------------------------------------------------------ __cold int mdbx_env_set_option(MDBX_env *env, const MDBX_option_t option, uint64_t value) { int err = check_env(env, false); if (unlikely(err != MDBX_SUCCESS)) return err; const bool lock_needed = ((env->flags & ENV_ACTIVE) && env->basal_txn && !env_txn0_owned(env)); bool should_unlock = false; switch (option) { case MDBX_opt_sync_bytes: if (value == /* default */ UINT64_MAX) value = MAX_WRITE; if (unlikely(env->flags & MDBX_RDONLY)) return MDBX_EACCESS; if (unlikely(!(env->flags & ENV_ACTIVE))) return MDBX_EPERM; if (unlikely(value > SIZE_MAX - 65536)) return MDBX_EINVAL; value = bytes2pgno(env, (size_t)value + env->ps - 1); if ((uint32_t)value != atomic_load32(&env->lck->autosync_threshold, mo_AcquireRelease) && atomic_store32(&env->lck->autosync_threshold, (uint32_t)value, mo_Relaxed) /* Дергаем sync(force=off) только если задано новое не-нулевое значение * и мы вне транзакции */ && lock_needed) { err = env_sync(env, false, false); if (err == /* нечего сбрасывать на диск */ MDBX_RESULT_TRUE) err = MDBX_SUCCESS; } break; case MDBX_opt_sync_period: if (value == /* default */ UINT64_MAX) value = 2780315 /* 42.42424 секунды */; if (unlikely(env->flags & MDBX_RDONLY)) return MDBX_EACCESS; if (unlikely(!(env->flags & ENV_ACTIVE))) return MDBX_EPERM; if (unlikely(value > UINT32_MAX)) return MDBX_EINVAL; value = osal_16dot16_to_monotime((uint32_t)value); if (value != atomic_load64(&env->lck->autosync_period, mo_AcquireRelease) && atomic_store64(&env->lck->autosync_period, value, mo_Relaxed) /* Дергаем sync(force=off) только если задано новое не-нулевое значение * и мы вне транзакции */ && lock_needed) { err = env_sync(env, false, false); if (err == /* нечего сбрасывать на диск */ MDBX_RESULT_TRUE) err = MDBX_SUCCESS; } break; case MDBX_opt_max_db: if (value == /* default */ UINT64_MAX) value = 42; if (unlikely(value > MDBX_MAX_DBI)) return MDBX_EINVAL; if (unlikely(env->dxb_mmap.base)) return MDBX_EPERM; env->max_dbi = (unsigned)value + CORE_DBS; break; case MDBX_opt_max_readers: if (value == /* default */ UINT64_MAX) value = MDBX_READERS_LIMIT; if (unlikely(value < 1 || value > MDBX_READERS_LIMIT)) return MDBX_EINVAL; if (unlikely(env->dxb_mmap.base)) return MDBX_EPERM; env->max_readers = (unsigned)value; break; case MDBX_opt_dp_reserve_limit: if (value == /* default */ UINT64_MAX) value = INT_MAX; if (unlikely(value > INT_MAX)) return MDBX_EINVAL; if (env->options.dp_reserve_limit != (unsigned)value) { if (lock_needed) { err = lck_txn_lock(env, false); if (unlikely(err != MDBX_SUCCESS)) return err; should_unlock = true; } env->options.dp_reserve_limit = (unsigned)value; while (env->shadow_reserve_len > env->options.dp_reserve_limit) { eASSERT(env, env->shadow_reserve != nullptr); page_t *dp = env->shadow_reserve; MDBX_ASAN_UNPOISON_MEMORY_REGION(dp, env->ps); VALGRIND_MAKE_MEM_DEFINED(&page_next(dp), sizeof(page_t *)); env->shadow_reserve = page_next(dp); void *const ptr = ptr_disp(dp, -(ptrdiff_t)sizeof(size_t)); osal_free(ptr); env->shadow_reserve_len -= 1; } } break; case MDBX_opt_rp_augment_limit: if (value == /* default */ UINT64_MAX) { env->options.flags.non_auto.rp_augment_limit = 0; env->options.rp_augment_limit = default_rp_augment_limit(env); } else if (unlikely(value > PAGELIST_LIMIT)) return MDBX_EINVAL; else { env->options.flags.non_auto.rp_augment_limit = 1; env->options.rp_augment_limit = (unsigned)value; } break; case MDBX_opt_gc_time_limit: if (value == /* default */ UINT64_MAX) value = 0; if (unlikely(value > UINT32_MAX)) return MDBX_EINVAL; if (unlikely(env->flags & MDBX_RDONLY)) return MDBX_EACCESS; value = osal_16dot16_to_monotime((uint32_t)value); if (value != env->options.gc_time_limit) { if (env->txn && lock_needed) return MDBX_EPERM; env->options.gc_time_limit = value; if (!env->options.flags.non_auto.rp_augment_limit) env->options.rp_augment_limit = default_rp_augment_limit(env); } break; case MDBX_opt_txn_dp_limit: case MDBX_opt_txn_dp_initial: if (value == /* default */ UINT64_MAX) value = PAGELIST_LIMIT; if (unlikely(value > PAGELIST_LIMIT || value < CURSOR_STACK_SIZE * 4)) return MDBX_EINVAL; if (unlikely(env->flags & MDBX_RDONLY)) return MDBX_EACCESS; if (lock_needed) { err = lck_txn_lock(env, false); if (unlikely(err != MDBX_SUCCESS)) return err; should_unlock = true; } if (env->txn) err = MDBX_EPERM /* unable change during transaction */; else { const pgno_t value32 = (pgno_t)value; if (option == MDBX_opt_txn_dp_initial && env->options.dp_initial != value32) { env->options.dp_initial = value32; if (env->options.dp_limit < value32) { env->options.dp_limit = value32; env->options.flags.non_auto.dp_limit = 1; } } if (option == MDBX_opt_txn_dp_limit && env->options.dp_limit != value32) { env->options.dp_limit = value32; env->options.flags.non_auto.dp_limit = 1; if (env->options.dp_initial > value32) env->options.dp_initial = value32; } } break; case MDBX_opt_spill_max_denominator: if (value == /* default */ UINT64_MAX) value = 8; if (unlikely(value > 255)) return MDBX_EINVAL; env->options.spill_max_denominator = (uint8_t)value; break; case MDBX_opt_spill_min_denominator: if (value == /* default */ UINT64_MAX) value = 8; if (unlikely(value > 255)) return MDBX_EINVAL; env->options.spill_min_denominator = (uint8_t)value; break; case MDBX_opt_spill_parent4child_denominator: if (value == /* default */ UINT64_MAX) value = 0; if (unlikely(value > 255)) return MDBX_EINVAL; env->options.spill_parent4child_denominator = (uint8_t)value; break; case MDBX_opt_loose_limit: if (value == /* default */ UINT64_MAX) value = 64; if (unlikely(value > 255)) return MDBX_EINVAL; env->options.dp_loose_limit = (uint8_t)value; break; case MDBX_opt_merge_threshold_16dot16_percent: if (value == /* default */ UINT64_MAX) value = 65536 / 4 /* 25% */; if (unlikely(value < 8192 || value > 32768)) return MDBX_EINVAL; env->options.merge_threshold_16dot16_percent = (unsigned)value; recalculate_merge_thresholds(env); break; case MDBX_opt_writethrough_threshold: #if defined(_WIN32) || defined(_WIN64) /* позволяем "установить" значение по-умолчанию и совпадающее * с поведением соответствующим текущей установке MDBX_NOMETASYNC */ if (value == /* default */ UINT64_MAX && value != ((env->flags & MDBX_NOMETASYNC) ? 0 : UINT_MAX)) err = MDBX_EINVAL; #else if (value == /* default */ UINT64_MAX) value = MDBX_WRITETHROUGH_THRESHOLD_DEFAULT; if (value != (unsigned)value) err = MDBX_EINVAL; else env->options.writethrough_threshold = (unsigned)value; #endif break; case MDBX_opt_prefault_write_enable: if (value == /* default */ UINT64_MAX) { env->options.prefault_write = default_prefault_write(env); env->options.flags.non_auto.prefault_write = false; } else if (value > 1) err = MDBX_EINVAL; else { env->options.prefault_write = value != 0; env->options.flags.non_auto.prefault_write = true; } break; case MDBX_opt_prefer_waf_insteadof_balance: if (value == /* default */ UINT64_MAX) env->options.prefer_waf_insteadof_balance = default_prefer_waf_insteadof_balance(env); else if (value > 1) err = MDBX_EINVAL; else env->options.prefer_waf_insteadof_balance = value != 0; break; default: return MDBX_EINVAL; } if (should_unlock) lck_txn_unlock(env); return err; } __cold int mdbx_env_get_option(const MDBX_env *env, const MDBX_option_t option, uint64_t *pvalue) { int err = check_env(env, false); if (unlikely(err != MDBX_SUCCESS)) return err; if (unlikely(!pvalue)) return MDBX_EINVAL; switch (option) { case MDBX_opt_sync_bytes: if (unlikely(!(env->flags & ENV_ACTIVE))) return MDBX_EPERM; *pvalue = pgno2bytes( env, atomic_load32(&env->lck->autosync_threshold, mo_Relaxed)); break; case MDBX_opt_sync_period: if (unlikely(!(env->flags & ENV_ACTIVE))) return MDBX_EPERM; *pvalue = osal_monotime_to_16dot16( atomic_load64(&env->lck->autosync_period, mo_Relaxed)); break; case MDBX_opt_max_db: *pvalue = env->max_dbi - CORE_DBS; break; case MDBX_opt_max_readers: *pvalue = env->max_readers; break; case MDBX_opt_dp_reserve_limit: *pvalue = env->options.dp_reserve_limit; break; case MDBX_opt_rp_augment_limit: *pvalue = env->options.rp_augment_limit; break; case MDBX_opt_gc_time_limit: *pvalue = osal_monotime_to_16dot16(env->options.gc_time_limit); break; case MDBX_opt_txn_dp_limit: *pvalue = env->options.dp_limit; break; case MDBX_opt_txn_dp_initial: *pvalue = env->options.dp_initial; break; case MDBX_opt_spill_max_denominator: *pvalue = env->options.spill_max_denominator; break; case MDBX_opt_spill_min_denominator: *pvalue = env->options.spill_min_denominator; break; case MDBX_opt_spill_parent4child_denominator: *pvalue = env->options.spill_parent4child_denominator; break; case MDBX_opt_loose_limit: *pvalue = env->options.dp_loose_limit; break; case MDBX_opt_merge_threshold_16dot16_percent: *pvalue = env->options.merge_threshold_16dot16_percent; break; case MDBX_opt_writethrough_threshold: #if defined(_WIN32) || defined(_WIN64) *pvalue = (env->flags & MDBX_NOMETASYNC) ? 0 : INT_MAX; #else *pvalue = env->options.writethrough_threshold; #endif break; case MDBX_opt_prefault_write_enable: *pvalue = env->options.prefault_write; break; case MDBX_opt_prefer_waf_insteadof_balance: *pvalue = env->options.prefer_waf_insteadof_balance; break; default: return MDBX_EINVAL; } return MDBX_SUCCESS; }