2018-03-07 12:09:43 +03:00
|
|
|
/*
|
2018-02-04 13:09:18 +03:00
|
|
|
* Copyright 2015-2018 Leonid Yuriev <leo@yuriev.ru>
|
2017-03-16 18:09:27 +03:00
|
|
|
* and other libmdbx authors: please see AUTHORS file.
|
|
|
|
* All rights reserved.
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted only as authorized by the OpenLDAP
|
|
|
|
* Public License.
|
|
|
|
*
|
|
|
|
* A copy of this license is available in the file LICENSE in the
|
|
|
|
* top-level directory of the distribution or, alternatively, at
|
|
|
|
* <http://www.OpenLDAP.org/license.html>.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "./bits.h"
|
|
|
|
|
|
|
|
/* PREAMBLE FOR WINDOWS:
|
|
|
|
*
|
|
|
|
* We are not concerned for performance here.
|
|
|
|
* If you are running Windows a performance could NOT be the goal.
|
|
|
|
* Otherwise please use Linux.
|
|
|
|
*
|
|
|
|
* Regards,
|
|
|
|
* LY
|
|
|
|
*/
|
|
|
|
|
2018-06-12 17:05:25 +03:00
|
|
|
static void mdbx_winnt_import(void);
|
2017-03-16 18:09:27 +03:00
|
|
|
|
2018-06-12 17:05:25 +03:00
|
|
|
#if !MDBX_CONFIG_MANUAL_TLS_CALLBACK
|
|
|
|
static
|
|
|
|
#endif /* !MDBX_CONFIG_MANUAL_TLS_CALLBACK */
|
|
|
|
void NTAPI
|
|
|
|
mdbx_dll_callback(PVOID module, DWORD reason, PVOID reserved) {
|
2017-03-16 18:09:27 +03:00
|
|
|
(void)reserved;
|
|
|
|
switch (reason) {
|
|
|
|
case DLL_PROCESS_ATTACH:
|
2018-06-12 17:05:25 +03:00
|
|
|
mdbx_winnt_import();
|
2018-03-28 15:57:16 +03:00
|
|
|
mdbx_rthc_global_init();
|
2017-03-16 18:09:27 +03:00
|
|
|
break;
|
|
|
|
case DLL_PROCESS_DETACH:
|
2018-03-28 15:57:16 +03:00
|
|
|
mdbx_rthc_global_dtor();
|
2017-03-16 18:09:27 +03:00
|
|
|
break;
|
|
|
|
|
|
|
|
case DLL_THREAD_ATTACH:
|
|
|
|
break;
|
|
|
|
case DLL_THREAD_DETACH:
|
2018-03-28 15:57:16 +03:00
|
|
|
mdbx_rthc_thread_dtor(module);
|
2017-03-16 18:09:27 +03:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-06-12 17:05:25 +03:00
|
|
|
#if !MDBX_CONFIG_MANUAL_TLS_CALLBACK
|
2017-03-16 18:09:27 +03:00
|
|
|
/* *INDENT-OFF* */
|
|
|
|
/* clang-format off */
|
|
|
|
#if defined(_MSC_VER)
|
|
|
|
# pragma const_seg(push)
|
|
|
|
# pragma data_seg(push)
|
|
|
|
|
|
|
|
# ifdef _WIN64
|
|
|
|
/* kick a linker to create the TLS directory if not already done */
|
|
|
|
# pragma comment(linker, "/INCLUDE:_tls_used")
|
|
|
|
/* Force some symbol references. */
|
2018-06-12 17:05:25 +03:00
|
|
|
# pragma comment(linker, "/INCLUDE:mdbx_tls_anchor")
|
2017-03-16 18:09:27 +03:00
|
|
|
/* specific const-segment for WIN64 */
|
|
|
|
# pragma const_seg(".CRT$XLB")
|
|
|
|
const
|
|
|
|
# else
|
|
|
|
/* kick a linker to create the TLS directory if not already done */
|
|
|
|
# pragma comment(linker, "/INCLUDE:__tls_used")
|
|
|
|
/* Force some symbol references. */
|
2018-06-12 17:05:25 +03:00
|
|
|
# pragma comment(linker, "/INCLUDE:_mdbx_tls_anchor")
|
2017-03-16 18:09:27 +03:00
|
|
|
/* specific data-segment for WIN32 */
|
|
|
|
# pragma data_seg(".CRT$XLB")
|
|
|
|
# endif
|
|
|
|
|
2018-06-12 17:05:25 +03:00
|
|
|
__declspec(allocate(".CRT$XLB")) PIMAGE_TLS_CALLBACK mdbx_tls_anchor = mdbx_dll_callback;
|
2017-03-16 18:09:27 +03:00
|
|
|
# pragma data_seg(pop)
|
|
|
|
# pragma const_seg(pop)
|
|
|
|
|
|
|
|
#elif defined(__GNUC__)
|
|
|
|
# ifdef _WIN64
|
|
|
|
const
|
|
|
|
# endif
|
2018-06-12 17:05:25 +03:00
|
|
|
PIMAGE_TLS_CALLBACK mdbx_tls_anchor __attribute__((section(".CRT$XLB"), used)) = mdbx_dll_callback;
|
2017-03-16 18:09:27 +03:00
|
|
|
#else
|
|
|
|
# error FIXME
|
|
|
|
#endif
|
|
|
|
/* *INDENT-ON* */
|
|
|
|
/* clang-format on */
|
2018-06-12 17:05:25 +03:00
|
|
|
#endif /* !MDBX_CONFIG_MANUAL_TLS_CALLBACK */
|
2017-03-16 18:09:27 +03:00
|
|
|
|
|
|
|
/*----------------------------------------------------------------------------*/
|
|
|
|
|
|
|
|
#define LCK_SHARED 0
|
|
|
|
#define LCK_EXCLUSIVE LOCKFILE_EXCLUSIVE_LOCK
|
|
|
|
#define LCK_WAITFOR 0
|
|
|
|
#define LCK_DONTWAIT LOCKFILE_FAIL_IMMEDIATELY
|
|
|
|
|
2017-05-24 18:50:24 +03:00
|
|
|
static __inline BOOL flock(mdbx_filehandle_t fd, DWORD flags, uint64_t offset,
|
2017-04-26 14:17:52 +03:00
|
|
|
size_t bytes) {
|
2017-03-16 18:09:27 +03:00
|
|
|
OVERLAPPED ov;
|
|
|
|
ov.hEvent = 0;
|
|
|
|
ov.Offset = (DWORD)offset;
|
|
|
|
ov.OffsetHigh = HIGH_DWORD(offset);
|
|
|
|
return LockFileEx(fd, flags, 0, (DWORD)bytes, HIGH_DWORD(bytes), &ov);
|
|
|
|
}
|
|
|
|
|
2017-05-24 18:50:24 +03:00
|
|
|
static __inline BOOL funlock(mdbx_filehandle_t fd, uint64_t offset,
|
|
|
|
size_t bytes) {
|
2017-04-26 14:17:52 +03:00
|
|
|
return UnlockFile(fd, (DWORD)offset, HIGH_DWORD(offset), (DWORD)bytes,
|
|
|
|
HIGH_DWORD(bytes));
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/*----------------------------------------------------------------------------*/
|
|
|
|
/* global `write` lock for write-txt processing,
|
|
|
|
* exclusive locking both meta-pages) */
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
#define LCK_MAXLEN (1u + (size_t)(MAXSSIZE_T))
|
|
|
|
#define LCK_META_OFFSET 0
|
|
|
|
#define LCK_META_LEN 0x10000u
|
|
|
|
#define LCK_BODY_OFFSET LCK_META_LEN
|
2018-01-09 21:32:01 +03:00
|
|
|
#define LCK_BODY_LEN (LCK_MAXLEN - LCK_BODY_OFFSET)
|
2017-04-23 12:57:27 +03:00
|
|
|
#define LCK_META LCK_META_OFFSET, LCK_META_LEN
|
|
|
|
#define LCK_BODY LCK_BODY_OFFSET, LCK_BODY_LEN
|
|
|
|
#define LCK_WHOLE 0, LCK_MAXLEN
|
|
|
|
|
2017-10-26 21:47:41 +03:00
|
|
|
int mdbx_txn_lock(MDBX_env *env, bool dontwait) {
|
2018-01-31 15:15:54 +03:00
|
|
|
if (dontwait) {
|
|
|
|
if (!TryEnterCriticalSection(&env->me_windowsbug_lock))
|
|
|
|
return MDBX_BUSY;
|
|
|
|
} else {
|
|
|
|
EnterCriticalSection(&env->me_windowsbug_lock);
|
|
|
|
}
|
|
|
|
|
2018-06-18 21:29:12 +03:00
|
|
|
if (flock(env->me_fd,
|
|
|
|
dontwait ? (LCK_EXCLUSIVE | LCK_DONTWAIT)
|
|
|
|
: (LCK_EXCLUSIVE | LCK_WAITFOR),
|
2017-10-26 21:47:41 +03:00
|
|
|
LCK_BODY))
|
2017-10-25 19:41:28 -04:00
|
|
|
return MDBX_SUCCESS;
|
|
|
|
int rc = GetLastError();
|
2018-01-31 15:15:54 +03:00
|
|
|
LeaveCriticalSection(&env->me_windowsbug_lock);
|
2017-10-26 21:47:41 +03:00
|
|
|
return (!dontwait || rc != ERROR_LOCK_VIOLATION) ? rc : MDBX_BUSY;
|
2017-10-25 19:41:28 -04:00
|
|
|
}
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
void mdbx_txn_unlock(MDBX_env *env) {
|
2018-01-31 15:15:54 +03:00
|
|
|
int rc = funlock(env->me_fd, LCK_BODY);
|
|
|
|
LeaveCriticalSection(&env->me_windowsbug_lock);
|
|
|
|
if (!rc)
|
2017-03-16 18:09:27 +03:00
|
|
|
mdbx_panic("%s failed: errcode %u", mdbx_func_, GetLastError());
|
|
|
|
}
|
|
|
|
|
|
|
|
/*----------------------------------------------------------------------------*/
|
|
|
|
/* global `read` lock for readers registration,
|
|
|
|
* exclusive locking `mti_numreaders` (second) cacheline */
|
|
|
|
|
|
|
|
#define LCK_LO_OFFSET 0
|
|
|
|
#define LCK_LO_LEN offsetof(MDBX_lockinfo, mti_numreaders)
|
|
|
|
#define LCK_UP_OFFSET LCK_LO_LEN
|
|
|
|
#define LCK_UP_LEN (MDBX_LOCKINFO_WHOLE_SIZE - LCK_UP_OFFSET)
|
|
|
|
#define LCK_LOWER LCK_LO_OFFSET, LCK_LO_LEN
|
|
|
|
#define LCK_UPPER LCK_UP_OFFSET, LCK_UP_LEN
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
int mdbx_rdt_lock(MDBX_env *env) {
|
2018-06-12 16:43:33 +03:00
|
|
|
mdbx_srwlock_AcquireShared(&env->me_remap_guard);
|
2017-03-16 18:09:27 +03:00
|
|
|
if (env->me_lfd == INVALID_HANDLE_VALUE)
|
2017-05-24 01:42:10 +03:00
|
|
|
return MDBX_SUCCESS; /* readonly database in readonly filesystem */
|
2017-03-16 18:09:27 +03:00
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* transite from S-? (used) to S-E (locked), e.g. exclusive lock upper-part */
|
2017-03-16 18:09:27 +03:00
|
|
|
if (flock(env->me_lfd, LCK_EXCLUSIVE | LCK_WAITFOR, LCK_UPPER))
|
2017-05-24 01:42:10 +03:00
|
|
|
return MDBX_SUCCESS;
|
2018-04-12 00:56:38 +03:00
|
|
|
|
|
|
|
int rc = GetLastError();
|
2018-06-12 16:43:33 +03:00
|
|
|
mdbx_srwlock_ReleaseShared(&env->me_remap_guard);
|
2018-04-12 00:56:38 +03:00
|
|
|
return rc;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
void mdbx_rdt_unlock(MDBX_env *env) {
|
2017-03-16 18:09:27 +03:00
|
|
|
if (env->me_lfd != INVALID_HANDLE_VALUE) {
|
|
|
|
/* transite from S-E (locked) to S-? (used), e.g. unlock upper-part */
|
|
|
|
if (!funlock(env->me_lfd, LCK_UPPER))
|
|
|
|
mdbx_panic("%s failed: errcode %u", mdbx_func_, GetLastError());
|
|
|
|
}
|
2018-06-12 16:43:33 +03:00
|
|
|
mdbx_srwlock_ReleaseShared(&env->me_remap_guard);
|
2018-01-07 14:37:38 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
static int suspend_and_append(mdbx_handle_array_t **array,
|
|
|
|
const DWORD ThreadId) {
|
|
|
|
const unsigned limit = (*array)->limit;
|
|
|
|
if ((*array)->count == limit) {
|
|
|
|
void *ptr = realloc((limit > ARRAY_LENGTH((*array)->handles))
|
|
|
|
? *array
|
|
|
|
: /* don't free initial array on the stack */ NULL,
|
|
|
|
sizeof(mdbx_handle_array_t) +
|
|
|
|
sizeof(HANDLE) *
|
|
|
|
(limit * 2 - ARRAY_LENGTH((*array)->handles)));
|
|
|
|
if (!ptr)
|
|
|
|
return MDBX_ENOMEM;
|
|
|
|
(*array) = (mdbx_handle_array_t *)ptr;
|
|
|
|
(*array)->limit = limit * 2;
|
|
|
|
}
|
|
|
|
|
|
|
|
HANDLE hThread = OpenThread(THREAD_SUSPEND_RESUME, FALSE, ThreadId);
|
|
|
|
if (hThread == NULL)
|
|
|
|
return GetLastError();
|
|
|
|
if (SuspendThread(hThread) == -1) {
|
|
|
|
CloseHandle(hThread);
|
|
|
|
return GetLastError();
|
|
|
|
}
|
|
|
|
|
|
|
|
(*array)->handles[(*array)->count++] = hThread;
|
|
|
|
return MDBX_SUCCESS;
|
|
|
|
}
|
|
|
|
|
|
|
|
int mdbx_suspend_threads_before_remap(MDBX_env *env,
|
|
|
|
mdbx_handle_array_t **array) {
|
|
|
|
const mdbx_pid_t CurrentTid = GetCurrentThreadId();
|
|
|
|
int rc;
|
|
|
|
if (env->me_lck) {
|
|
|
|
/* Scan LCK for threads of the current process */
|
|
|
|
const MDBX_reader *const begin = env->me_lck->mti_readers;
|
|
|
|
const MDBX_reader *const end = begin + env->me_lck->mti_numreaders;
|
|
|
|
const mdbx_tid_t WriteTxnOwner = env->me_txn0 ? env->me_txn0->mt_owner : 0;
|
|
|
|
for (const MDBX_reader *reader = begin; reader < end; ++reader) {
|
2018-01-08 18:07:11 +03:00
|
|
|
if (reader->mr_pid != env->me_pid || !reader->mr_tid) {
|
|
|
|
skip_lck:
|
2018-01-07 14:37:38 +03:00
|
|
|
continue;
|
2018-01-08 18:07:11 +03:00
|
|
|
}
|
|
|
|
if (reader->mr_tid == CurrentTid || reader->mr_tid == WriteTxnOwner)
|
|
|
|
goto skip_lck;
|
2018-01-07 14:37:38 +03:00
|
|
|
if (env->me_flags & MDBX_NOTLS) {
|
|
|
|
/* Skip duplicates in no-tls mode */
|
2018-01-08 18:07:11 +03:00
|
|
|
for (const MDBX_reader *scan = reader; --scan >= begin;)
|
2018-01-07 14:37:38 +03:00
|
|
|
if (scan->mr_tid == reader->mr_tid)
|
2018-01-08 18:07:11 +03:00
|
|
|
goto skip_lck;
|
2018-01-07 14:37:38 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
rc = suspend_and_append(array, reader->mr_tid);
|
|
|
|
if (rc != MDBX_SUCCESS) {
|
|
|
|
bailout_lck:
|
|
|
|
(void)mdbx_resume_threads_after_remap(*array);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (WriteTxnOwner && WriteTxnOwner != CurrentTid) {
|
|
|
|
rc = suspend_and_append(array, WriteTxnOwner);
|
|
|
|
if (rc != MDBX_SUCCESS)
|
|
|
|
goto bailout_lck;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/* Without LCK (i.e. read-only mode).
|
|
|
|
* Walk thougth a snapshot of all running threads */
|
2018-01-08 18:07:11 +03:00
|
|
|
mdbx_assert(env, env->me_txn0 == NULL);
|
|
|
|
const HANDLE hSnapshot = CreateToolhelp32Snapshot(TH32CS_SNAPTHREAD, 0);
|
|
|
|
if (hSnapshot == INVALID_HANDLE_VALUE)
|
2018-01-07 14:37:38 +03:00
|
|
|
return GetLastError();
|
|
|
|
|
|
|
|
THREADENTRY32 entry;
|
|
|
|
entry.dwSize = sizeof(THREADENTRY32);
|
|
|
|
|
2018-01-08 18:07:11 +03:00
|
|
|
if (!Thread32First(hSnapshot, &entry)) {
|
2018-01-07 14:37:38 +03:00
|
|
|
rc = GetLastError();
|
|
|
|
bailout_toolhelp:
|
2018-01-08 18:07:11 +03:00
|
|
|
CloseHandle(hSnapshot);
|
2018-01-07 14:37:38 +03:00
|
|
|
(void)mdbx_resume_threads_after_remap(*array);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
|
|
|
do {
|
|
|
|
if (entry.th32OwnerProcessID != env->me_pid ||
|
|
|
|
entry.th32ThreadID == CurrentTid)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
rc = suspend_and_append(array, entry.th32ThreadID);
|
|
|
|
if (rc != MDBX_SUCCESS)
|
|
|
|
goto bailout_toolhelp;
|
|
|
|
|
2018-01-08 18:07:11 +03:00
|
|
|
} while (Thread32Next(hSnapshot, &entry));
|
2018-01-07 14:37:38 +03:00
|
|
|
|
|
|
|
rc = GetLastError();
|
|
|
|
if (rc != ERROR_NO_MORE_FILES)
|
|
|
|
goto bailout_toolhelp;
|
2018-01-08 18:07:11 +03:00
|
|
|
CloseHandle(hSnapshot);
|
2018-01-07 14:37:38 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
return MDBX_SUCCESS;
|
|
|
|
}
|
|
|
|
|
|
|
|
int mdbx_resume_threads_after_remap(mdbx_handle_array_t *array) {
|
|
|
|
int rc = MDBX_SUCCESS;
|
|
|
|
for (unsigned i = 0; i < array->count; ++i) {
|
|
|
|
if (ResumeThread(array->handles[i]) == -1)
|
|
|
|
rc = GetLastError();
|
|
|
|
CloseHandle(array->handles[i]);
|
|
|
|
}
|
|
|
|
return rc;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/*----------------------------------------------------------------------------*/
|
|
|
|
/* global `initial` lock for lockfile initialization,
|
2017-07-19 09:12:46 +03:00
|
|
|
* exclusive/shared locking first cacheline */
|
2017-03-16 18:09:27 +03:00
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
/* FIXME: locking schema/algo descritpion.
|
2017-03-16 18:09:27 +03:00
|
|
|
?-? = free
|
|
|
|
S-? = used
|
2017-07-19 09:12:46 +03:00
|
|
|
E-? = exclusive-read
|
2017-03-16 18:09:27 +03:00
|
|
|
?-S
|
|
|
|
?-E = middle
|
|
|
|
S-S
|
|
|
|
S-E = locked
|
|
|
|
E-S
|
2017-07-19 09:12:46 +03:00
|
|
|
E-E = exclusive-write
|
2017-03-16 18:09:27 +03:00
|
|
|
*/
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
int mdbx_lck_init(MDBX_env *env) {
|
2017-03-16 18:09:27 +03:00
|
|
|
(void)env;
|
2017-05-24 01:42:10 +03:00
|
|
|
return MDBX_SUCCESS;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* Seize state as 'exclusive-write' (E-E and returns MDBX_RESULT_TRUE)
|
|
|
|
* or as 'used' (S-? and returns MDBX_RESULT_FALSE), otherwise returns an error
|
|
|
|
*/
|
2017-04-23 12:57:27 +03:00
|
|
|
static int internal_seize_lck(HANDLE lfd) {
|
|
|
|
int rc;
|
|
|
|
assert(lfd != INVALID_HANDLE_VALUE);
|
2017-03-16 18:09:27 +03:00
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
/* 1) now on ?-? (free), get ?-E (middle) */
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-04-23 12:57:27 +03:00
|
|
|
if (!flock(lfd, LCK_EXCLUSIVE | LCK_WAITFOR, LCK_UPPER)) {
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError() /* 2) something went wrong, give up */;
|
2017-04-23 12:57:27 +03:00
|
|
|
mdbx_error("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"?-?(free) >> ?-E(middle)", rc);
|
|
|
|
return rc;
|
|
|
|
}
|
2017-04-26 14:17:52 +03:00
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* 3) now on ?-E (middle), try E-E (exclusive-write) */
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-04-23 12:57:27 +03:00
|
|
|
if (flock(lfd, LCK_EXCLUSIVE | LCK_DONTWAIT, LCK_LOWER))
|
2017-07-19 09:12:46 +03:00
|
|
|
return MDBX_RESULT_TRUE /* 4) got E-E (exclusive-write), done */;
|
2017-03-16 18:09:27 +03:00
|
|
|
|
|
|
|
/* 5) still on ?-E (middle) */
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-03-16 18:09:27 +03:00
|
|
|
if (rc != ERROR_SHARING_VIOLATION && rc != ERROR_LOCK_VIOLATION) {
|
|
|
|
/* 6) something went wrong, give up */
|
2017-05-15 12:08:04 +03:00
|
|
|
if (!funlock(lfd, LCK_UPPER))
|
2017-03-16 18:09:27 +03:00
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
2017-05-15 12:08:04 +03:00
|
|
|
"?-E(middle) >> ?-?(free)", GetLastError());
|
2017-03-16 18:09:27 +03:00
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* 7) still on ?-E (middle), try S-E (locked) */
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = flock(lfd, LCK_SHARED | LCK_DONTWAIT, LCK_LOWER) ? MDBX_RESULT_FALSE
|
|
|
|
: GetLastError();
|
2017-04-23 12:57:27 +03:00
|
|
|
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-04-23 12:57:27 +03:00
|
|
|
if (rc != MDBX_RESULT_FALSE)
|
|
|
|
mdbx_error("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"?-E(middle) >> S-E(locked)", rc);
|
2017-03-16 18:09:27 +03:00
|
|
|
|
|
|
|
/* 8) now on S-E (locked) or still on ?-E (middle),
|
2018-06-18 21:29:12 +03:00
|
|
|
* transite to S-? (used) or ?-? (free) */
|
2017-05-15 12:08:04 +03:00
|
|
|
if (!funlock(lfd, LCK_UPPER))
|
2017-03-16 18:09:27 +03:00
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
2017-05-15 12:08:04 +03:00
|
|
|
"X-E(locked/middle) >> X-?(used/free)", GetLastError());
|
2017-03-16 18:09:27 +03:00
|
|
|
|
|
|
|
/* 9) now on S-? (used, DONE) or ?-? (free, FAILURE) */
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
int mdbx_lck_seize(MDBX_env *env) {
|
2017-03-16 18:09:27 +03:00
|
|
|
int rc;
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
assert(env->me_fd != INVALID_HANDLE_VALUE);
|
|
|
|
if (env->me_lfd == INVALID_HANDLE_VALUE) {
|
|
|
|
/* LY: without-lck mode (e.g. on read-only filesystem) */
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-04-23 12:57:27 +03:00
|
|
|
if (!flock(env->me_fd, LCK_SHARED | LCK_DONTWAIT, LCK_WHOLE)) {
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-04-23 12:57:27 +03:00
|
|
|
mdbx_error("%s(%s) failed: errcode %u", mdbx_func_, "without-lck", rc);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
return MDBX_RESULT_FALSE;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
rc = internal_seize_lck(env->me_lfd);
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-05-24 01:42:10 +03:00
|
|
|
if (rc == MDBX_RESULT_TRUE && (env->me_flags & MDBX_RDONLY) == 0) {
|
2017-04-23 12:57:27 +03:00
|
|
|
/* Check that another process don't operates in without-lck mode.
|
|
|
|
* Doing such check by exclusive locking the body-part of db. Should be
|
|
|
|
* noted:
|
|
|
|
* - we need an exclusive lock for do so;
|
|
|
|
* - we can't lock meta-pages, otherwise other process could get an error
|
|
|
|
* while opening db in valid (non-conflict) mode. */
|
|
|
|
if (!flock(env->me_fd, LCK_EXCLUSIVE | LCK_DONTWAIT, LCK_BODY)) {
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-04-23 12:57:27 +03:00
|
|
|
mdbx_error("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"lock-against-without-lck", rc);
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-04-23 12:57:27 +03:00
|
|
|
mdbx_lck_destroy(env);
|
2017-04-26 14:17:52 +03:00
|
|
|
} else {
|
2017-04-27 15:51:58 +03:00
|
|
|
mdbx_jitter4testing(false);
|
2017-05-15 12:08:04 +03:00
|
|
|
if (!funlock(env->me_fd, LCK_BODY))
|
2017-04-26 14:17:52 +03:00
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
2017-05-15 12:08:04 +03:00
|
|
|
"unlock-against-without-lck", GetLastError());
|
2017-04-23 12:57:27 +03:00
|
|
|
}
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
int mdbx_lck_downgrade(MDBX_env *env, bool complete) {
|
|
|
|
/* Transite from exclusive state (E-?) to used (S-?) */
|
2017-04-23 12:57:27 +03:00
|
|
|
assert(env->me_fd != INVALID_HANDLE_VALUE);
|
2017-06-06 20:18:09 +03:00
|
|
|
assert(env->me_lfd != INVALID_HANDLE_VALUE);
|
2017-04-23 12:57:27 +03:00
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* 1) must be at E-E (exclusive-write) */
|
|
|
|
if (!complete) {
|
|
|
|
/* transite from E-E to E_? (exclusive-read) */
|
|
|
|
if (!funlock(env->me_lfd, LCK_UPPER))
|
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"E-E(exclusive-write) >> E-?(exclusive-read)", GetLastError());
|
|
|
|
return MDBX_SUCCESS /* 2) now at E-? (exclusive-read), done */;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* 3) now at E-E (exclusive-write), transite to ?_E (middle) */
|
2017-06-06 20:18:09 +03:00
|
|
|
if (!funlock(env->me_lfd, LCK_LOWER))
|
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
2017-07-19 09:12:46 +03:00
|
|
|
"E-E(exclusive-write) >> ?-E(middle)", GetLastError());
|
2017-04-23 12:57:27 +03:00
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* 4) now at ?-E (middle), transite to S-E (locked) */
|
2017-06-06 20:18:09 +03:00
|
|
|
if (!flock(env->me_lfd, LCK_SHARED | LCK_DONTWAIT, LCK_LOWER)) {
|
2017-07-19 09:12:46 +03:00
|
|
|
int rc = GetLastError() /* 5) something went wrong, give up */;
|
|
|
|
mdbx_error("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"?-E(middle) >> S-E(locked)", rc);
|
2017-06-06 20:18:09 +03:00
|
|
|
return rc;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
2017-06-06 20:18:09 +03:00
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* 6) got S-E (locked), continue transition to S-? (used) */
|
2017-06-06 20:18:09 +03:00
|
|
|
if (!funlock(env->me_lfd, LCK_UPPER))
|
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"S-E(locked) >> S-?(used)", GetLastError());
|
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
return MDBX_SUCCESS /* 7) now at S-? (used), done */;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-06-06 20:18:09 +03:00
|
|
|
int mdbx_lck_upgrade(MDBX_env *env) {
|
2017-07-19 09:12:46 +03:00
|
|
|
/* Transite from locked state (S-E) to exclusive-write (E-E) */
|
2017-06-06 20:18:09 +03:00
|
|
|
assert(env->me_fd != INVALID_HANDLE_VALUE);
|
|
|
|
assert(env->me_lfd != INVALID_HANDLE_VALUE);
|
|
|
|
|
|
|
|
/* 1) must be at S-E (locked), transite to ?_E (middle) */
|
|
|
|
if (!funlock(env->me_lfd, LCK_LOWER))
|
|
|
|
mdbx_panic("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"S-E(locked) >> ?-E(middle)", GetLastError());
|
|
|
|
|
2017-07-19 09:12:46 +03:00
|
|
|
/* 3) now on ?-E (middle), try E-E (exclusive-write) */
|
2017-06-06 20:18:09 +03:00
|
|
|
mdbx_jitter4testing(false);
|
|
|
|
if (flock(env->me_lfd, LCK_EXCLUSIVE | LCK_DONTWAIT, LCK_LOWER))
|
2017-07-19 09:12:46 +03:00
|
|
|
return MDBX_RESULT_TRUE; /* 4) got E-E (exclusive-write), done */
|
2017-06-06 20:18:09 +03:00
|
|
|
|
|
|
|
/* 5) still on ?-E (middle) */
|
2017-06-21 01:41:25 +03:00
|
|
|
int rc = GetLastError();
|
2017-06-06 20:18:09 +03:00
|
|
|
mdbx_jitter4testing(false);
|
|
|
|
if (rc != ERROR_SHARING_VIOLATION && rc != ERROR_LOCK_VIOLATION) {
|
|
|
|
/* 6) something went wrong, report but continue */
|
|
|
|
mdbx_error("%s(%s) failed: errcode %u", mdbx_func_,
|
2017-07-19 09:12:46 +03:00
|
|
|
"?-E(middle) >> E-E(exclusive-write)", rc);
|
2017-06-06 20:18:09 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
/* 7) still on ?-E (middle), try restore S-E (locked) */
|
|
|
|
mdbx_jitter4testing(false);
|
|
|
|
rc = flock(env->me_lfd, LCK_SHARED | LCK_DONTWAIT, LCK_LOWER)
|
|
|
|
? MDBX_RESULT_FALSE
|
2017-06-21 01:41:25 +03:00
|
|
|
: GetLastError();
|
2017-06-06 20:18:09 +03:00
|
|
|
|
|
|
|
mdbx_jitter4testing(false);
|
|
|
|
if (rc != MDBX_RESULT_FALSE) {
|
|
|
|
mdbx_fatal("%s(%s) failed: errcode %u", mdbx_func_,
|
|
|
|
"?-E(middle) >> S-E(locked)", rc);
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* 8) now on S-E (locked) */
|
|
|
|
return MDBX_RESULT_FALSE;
|
|
|
|
}
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
void mdbx_lck_destroy(MDBX_env *env) {
|
2017-03-16 18:09:27 +03:00
|
|
|
int rc;
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
if (env->me_lfd != INVALID_HANDLE_VALUE) {
|
|
|
|
/* double `unlock` for robustly remove overlapped shared/exclusive locks */
|
|
|
|
while (funlock(env->me_lfd, LCK_LOWER))
|
|
|
|
;
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-04-23 12:57:27 +03:00
|
|
|
assert(rc == ERROR_NOT_LOCKED);
|
|
|
|
(void)rc;
|
|
|
|
SetLastError(ERROR_SUCCESS);
|
|
|
|
|
|
|
|
while (funlock(env->me_lfd, LCK_UPPER))
|
|
|
|
;
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-04-23 12:57:27 +03:00
|
|
|
assert(rc == ERROR_NOT_LOCKED);
|
|
|
|
(void)rc;
|
|
|
|
SetLastError(ERROR_SUCCESS);
|
|
|
|
}
|
|
|
|
|
2017-03-16 18:09:27 +03:00
|
|
|
if (env->me_fd != INVALID_HANDLE_VALUE) {
|
|
|
|
/* explicitly unlock to avoid latency for other processes (windows kernel
|
2017-06-06 20:18:09 +03:00
|
|
|
* releases such locks via deferred queues) */
|
2017-04-23 12:57:27 +03:00
|
|
|
while (funlock(env->me_fd, LCK_BODY))
|
2017-03-16 18:09:27 +03:00
|
|
|
;
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-03-16 18:09:27 +03:00
|
|
|
assert(rc == ERROR_NOT_LOCKED);
|
|
|
|
(void)rc;
|
|
|
|
SetLastError(ERROR_SUCCESS);
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
while (funlock(env->me_fd, LCK_META))
|
2017-03-16 18:09:27 +03:00
|
|
|
;
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-03-16 18:09:27 +03:00
|
|
|
assert(rc == ERROR_NOT_LOCKED);
|
|
|
|
(void)rc;
|
|
|
|
SetLastError(ERROR_SUCCESS);
|
|
|
|
|
2017-04-23 12:57:27 +03:00
|
|
|
while (funlock(env->me_fd, LCK_WHOLE))
|
2017-03-16 18:09:27 +03:00
|
|
|
;
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-03-16 18:09:27 +03:00
|
|
|
assert(rc == ERROR_NOT_LOCKED);
|
|
|
|
(void)rc;
|
|
|
|
SetLastError(ERROR_SUCCESS);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*----------------------------------------------------------------------------*/
|
|
|
|
/* reader checking (by pid) */
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
int mdbx_rpid_set(MDBX_env *env) {
|
2017-03-16 18:09:27 +03:00
|
|
|
(void)env;
|
2017-05-24 01:42:10 +03:00
|
|
|
return MDBX_SUCCESS;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-05-24 01:42:10 +03:00
|
|
|
int mdbx_rpid_clear(MDBX_env *env) {
|
2017-03-16 18:09:27 +03:00
|
|
|
(void)env;
|
2017-05-24 01:42:10 +03:00
|
|
|
return MDBX_SUCCESS;
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
2017-04-21 18:26:32 +03:00
|
|
|
/* Checks reader by pid.
|
|
|
|
*
|
|
|
|
* Returns:
|
|
|
|
* MDBX_RESULT_TRUE, if pid is live (unable to acquire lock)
|
|
|
|
* MDBX_RESULT_FALSE, if pid is dead (lock acquired)
|
|
|
|
* or otherwise the errcode. */
|
2017-05-24 01:42:10 +03:00
|
|
|
int mdbx_rpid_check(MDBX_env *env, mdbx_pid_t pid) {
|
2017-03-16 18:09:27 +03:00
|
|
|
(void)env;
|
2018-05-04 01:52:17 +03:00
|
|
|
HANDLE hProcess = OpenProcess(SYNCHRONIZE, FALSE, pid);
|
2017-03-16 18:09:27 +03:00
|
|
|
int rc;
|
2018-05-04 01:52:17 +03:00
|
|
|
if (likely(hProcess)) {
|
2017-03-16 18:09:27 +03:00
|
|
|
rc = WaitForSingleObject(hProcess, 0);
|
2018-05-04 01:52:17 +03:00
|
|
|
if (unlikely(rc == WAIT_FAILED))
|
|
|
|
rc = GetLastError();
|
2017-03-16 18:09:27 +03:00
|
|
|
CloseHandle(hProcess);
|
|
|
|
} else {
|
2017-06-21 01:41:25 +03:00
|
|
|
rc = GetLastError();
|
2017-03-16 18:09:27 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
switch (rc) {
|
|
|
|
case ERROR_INVALID_PARAMETER:
|
|
|
|
/* pid seem invalid */
|
|
|
|
return MDBX_RESULT_FALSE;
|
|
|
|
case WAIT_OBJECT_0:
|
|
|
|
/* process just exited */
|
|
|
|
return MDBX_RESULT_FALSE;
|
|
|
|
case WAIT_TIMEOUT:
|
|
|
|
/* pid running */
|
|
|
|
return MDBX_RESULT_TRUE;
|
|
|
|
default:
|
|
|
|
/* failure */
|
|
|
|
return rc;
|
|
|
|
}
|
|
|
|
}
|
2018-06-12 16:43:33 +03:00
|
|
|
|
|
|
|
//----------------------------------------------------------------------------
|
|
|
|
// Stub for slim read-write lock
|
|
|
|
// Copyright (C) 1995-2002 Brad Wilson
|
|
|
|
|
|
|
|
static void WINAPI stub_srwlock_Init(MDBX_srwlock *srwl) {
|
|
|
|
srwl->readerCount = srwl->writerCount = 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void WINAPI stub_srwlock_AcquireShared(MDBX_srwlock *srwl) {
|
|
|
|
while (true) {
|
|
|
|
assert(srwl->writerCount >= 0 && srwl->readerCount >= 0);
|
|
|
|
|
|
|
|
// If there's a writer already, spin without unnecessarily
|
|
|
|
// interlocking the CPUs
|
|
|
|
if (srwl->writerCount != 0) {
|
|
|
|
YieldProcessor();
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Add to the readers list
|
|
|
|
_InterlockedIncrement(&srwl->readerCount);
|
|
|
|
|
|
|
|
// Check for writers again (we may have been pre-empted). If
|
|
|
|
// there are no writers writing or waiting, then we're done.
|
|
|
|
if (srwl->writerCount == 0)
|
|
|
|
break;
|
|
|
|
|
|
|
|
// Remove from the readers list, spin, try again
|
|
|
|
_InterlockedDecrement(&srwl->readerCount);
|
|
|
|
YieldProcessor();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void WINAPI stub_srwlock_ReleaseShared(MDBX_srwlock *srwl) {
|
|
|
|
assert(srwl->readerCount > 0);
|
|
|
|
_InterlockedDecrement(&srwl->readerCount);
|
|
|
|
}
|
|
|
|
|
|
|
|
static void WINAPI stub_srwlock_AcquireExclusive(MDBX_srwlock *srwl) {
|
|
|
|
while (true) {
|
|
|
|
assert(srwl->writerCount >= 0 && srwl->readerCount >= 0);
|
|
|
|
|
|
|
|
// If there's a writer already, spin without unnecessarily
|
|
|
|
// interlocking the CPUs
|
|
|
|
if (srwl->writerCount != 0) {
|
|
|
|
YieldProcessor();
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
// See if we can become the writer (expensive, because it inter-
|
|
|
|
// locks the CPUs, so writing should be an infrequent process)
|
|
|
|
if (_InterlockedExchange(&srwl->writerCount, 1) == 0)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Now we're the writer, but there may be outstanding readers.
|
|
|
|
// Spin until there aren't any more; new readers will wait now
|
|
|
|
// that we're the writer.
|
|
|
|
while (srwl->readerCount != 0) {
|
|
|
|
assert(srwl->writerCount >= 0 && srwl->readerCount >= 0);
|
|
|
|
YieldProcessor();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
static void WINAPI stub_srwlock_ReleaseExclusive(MDBX_srwlock *srwl) {
|
|
|
|
assert(srwl->writerCount == 1 && srwl->readerCount >= 0);
|
|
|
|
srwl->writerCount = 0;
|
|
|
|
}
|
|
|
|
|
2018-06-12 17:05:25 +03:00
|
|
|
MDBX_srwlock_function mdbx_srwlock_Init, mdbx_srwlock_AcquireShared,
|
|
|
|
mdbx_srwlock_ReleaseShared, mdbx_srwlock_AcquireExclusive,
|
|
|
|
mdbx_srwlock_ReleaseExclusive;
|
|
|
|
|
|
|
|
/*----------------------------------------------------------------------------*/
|
|
|
|
|
|
|
|
static void mdbx_winnt_import(void) {
|
2018-06-12 16:43:33 +03:00
|
|
|
HINSTANCE hInst = GetModuleHandleA("kernel32.dll");
|
|
|
|
MDBX_srwlock_function init =
|
|
|
|
(MDBX_srwlock_function)GetProcAddress(hInst, "InitializeSRWLock");
|
|
|
|
if (init != NULL) {
|
2018-06-12 17:05:25 +03:00
|
|
|
mdbx_srwlock_Init = init;
|
2018-06-12 16:43:33 +03:00
|
|
|
mdbx_srwlock_AcquireShared =
|
|
|
|
(MDBX_srwlock_function)GetProcAddress(hInst, "AcquireSRWLockShared");
|
|
|
|
mdbx_srwlock_ReleaseShared =
|
|
|
|
(MDBX_srwlock_function)GetProcAddress(hInst, "ReleaseSRWLockShared");
|
|
|
|
mdbx_srwlock_AcquireExclusive =
|
|
|
|
(MDBX_srwlock_function)GetProcAddress(hInst, "AcquireSRWLockExclusive");
|
|
|
|
mdbx_srwlock_ReleaseExclusive =
|
|
|
|
(MDBX_srwlock_function)GetProcAddress(hInst, "ReleaseSRWLockExclusive");
|
|
|
|
} else {
|
2018-06-12 17:05:25 +03:00
|
|
|
mdbx_srwlock_Init = stub_srwlock_Init;
|
2018-06-12 16:43:33 +03:00
|
|
|
mdbx_srwlock_AcquireShared = stub_srwlock_AcquireShared;
|
|
|
|
mdbx_srwlock_ReleaseShared = stub_srwlock_ReleaseShared;
|
|
|
|
mdbx_srwlock_AcquireExclusive = stub_srwlock_AcquireExclusive;
|
|
|
|
mdbx_srwlock_ReleaseExclusive = stub_srwlock_ReleaseExclusive;
|
|
|
|
}
|
|
|
|
}
|