mdbx-load: add '-a' option for loading dumps of custom-sorted DBs.

Based on http://www.openldap.org/devel/gitweb.cgi?p=openldap.git;a=commitdiff;h=aa77c832b8e6fc696078017f550d119cdfc0f232

Change-Id: If7de71c8f6ffc29d4316c6074995fab38f2c1b4b

+load

Change-Id: Iff6cbca2514840ee290f801e3b273edf160913b4
This commit is contained in:
Leo Yuriev 2019-02-03 15:49:40 +03:00 committed by Leonid Yuriev
parent 9ba8434c1d
commit 309955be75
2 changed files with 53 additions and 14 deletions

View File

@ -39,6 +39,13 @@ option below.
.BR \-V .BR \-V
Write the library version number to the standard output, and exit. Write the library version number to the standard output, and exit.
.TP .TP
.BR \-a
Append all records in the order they appear in the input. The input is assumed to already be
in correctly sorted order and no sorting or checking for redundant values will be performed.
This option must be used to reload data that was produced by running
.B mdbx_dump
on a database that uses custom compare functions.
.TP
.BR \-f \ file .BR \-f \ file
Read from the specified file instead of from the standard input. Read from the specified file instead of from the standard input.
.TP .TP

View File

@ -1,4 +1,4 @@
/* mdbx_load.c - memory-mapped database load tool */ /* mdbx_load.c - memory-mapped database load tool */
/* /*
* Copyright 2015-2019 Leonid Yuriev <leo@yuriev.ru> * Copyright 2015-2019 Leonid Yuriev <leo@yuriev.ru>
@ -57,6 +57,7 @@ static int Eof;
static MDBX_envinfo envinfo; static MDBX_envinfo envinfo;
static MDBX_val kbuf, dbuf; static MDBX_val kbuf, dbuf;
static MDBX_val k0buf;
#define STRLENOF(s) (sizeof(s) - 1) #define STRLENOF(s) (sizeof(s) - 1)
@ -304,11 +305,18 @@ static int readline(MDBX_val *out, MDBX_val *buf) {
} }
static void usage(void) { static void usage(void) {
fprintf(stderr, "usage: %s [-V] [-f input] [-n] [-s name] [-N] [-T] dbpath\n", fprintf(stderr,
"usage: %s [-V] [-a] [-f input] [-n] [-s name] [-N] [-T] dbpath\n",
prog); prog);
exit(EXIT_FAILURE); exit(EXIT_FAILURE);
} }
static int anyway_greater(const MDBX_val *a, const MDBX_val *b) {
(void)a;
(void)b;
return 1;
}
int main(int argc, char *argv[]) { int main(int argc, char *argv[]) {
int i, rc; int i, rc;
MDBX_env *env = NULL; MDBX_env *env = NULL;
@ -316,28 +324,32 @@ int main(int argc, char *argv[]) {
MDBX_cursor *mc = NULL; MDBX_cursor *mc = NULL;
MDBX_dbi dbi; MDBX_dbi dbi;
char *envname = NULL; char *envname = NULL;
int envflags = 0, putflags = 0; int envflags = MDBX_UTTERLY_NOSYNC, putflags = 0;
int append = 0;
MDBX_val prevk;
prog = argv[0]; prog = argv[0];
if (argc < 2)
if (argc < 2) {
usage(); usage();
}
/* -f: load file instead of stdin /* -a: append records in input order
* -f: load file instead of stdin
* -n: use NOSUBDIR flag on env_open * -n: use NOSUBDIR flag on env_open
* -s: load into named subDB * -s: load into named subDB
* -N: use NOOVERWRITE on puts * -N: use NOOVERWRITE on puts
* -T: read plaintext * -T: read plaintext
* -V: print version and exit * -V: print version and exit
*/ */
while ((i = getopt(argc, argv, "f:ns:NTV")) != EOF) { while ((i = getopt(argc, argv, "af:ns:NTV")) != EOF) {
switch (i) { switch (i) {
case 'V': case 'V':
printf("%s (%s, build %s)\n", mdbx_version.git.describe, printf("%s (%s, build %s)\n", mdbx_version.git.describe,
mdbx_version.git.datetime, mdbx_build.datetime); mdbx_version.git.datetime, mdbx_build.datetime);
exit(EXIT_SUCCESS); exit(EXIT_SUCCESS);
break; break;
case 'a':
append = 1;
break;
case 'f': case 'f':
if (freopen(optarg, "r", stdin) == NULL) { if (freopen(optarg, "r", stdin) == NULL) {
fprintf(stderr, "%s: %s: reopen: %s\n", prog, optarg, fprintf(stderr, "%s: %s: reopen: %s\n", prog, optarg,
@ -381,6 +393,7 @@ int main(int argc, char *argv[]) {
dbuf.iov_len = 4096; dbuf.iov_len = 4096;
dbuf.iov_base = mdbx_malloc(dbuf.iov_len); dbuf.iov_base = mdbx_malloc(dbuf.iov_len);
/* read first header for mapsize= */
if (!(mode & NOHDR)) if (!(mode & NOHDR))
readhdr(); readhdr();
@ -419,7 +432,10 @@ int main(int argc, char *argv[]) {
} }
kbuf.iov_len = mdbx_env_get_maxkeysize(env) * 2 + 2; kbuf.iov_len = mdbx_env_get_maxkeysize(env) * 2 + 2;
kbuf.iov_base = mdbx_malloc(kbuf.iov_len); kbuf.iov_base = malloc(kbuf.iov_len * 2);
k0buf.iov_len = kbuf.iov_len;
k0buf.iov_base = (char *)kbuf.iov_base + kbuf.iov_len;
prevk.iov_base = k0buf.iov_base;
while (!Eof) { while (!Eof) {
if (user_break) { if (user_break) {
@ -427,9 +443,6 @@ int main(int argc, char *argv[]) {
break; break;
} }
MDBX_val key, data;
int batch = 0;
rc = mdbx_txn_begin(env, NULL, 0, &txn); rc = mdbx_txn_begin(env, NULL, 0, &txn);
if (rc) { if (rc) {
fprintf(stderr, "mdbx_txn_begin failed, error %d %s\n", rc, fprintf(stderr, "mdbx_txn_begin failed, error %d %s\n", rc,
@ -437,7 +450,9 @@ int main(int argc, char *argv[]) {
goto env_close; goto env_close;
} }
rc = mdbx_dbi_open(txn, subname, dbi_flags | MDBX_CREATE, &dbi); rc = mdbx_dbi_open_ex(txn, subname, dbi_flags | MDBX_CREATE, &dbi,
append ? anyway_greater : NULL,
append ? anyway_greater : NULL);
if (rc) { if (rc) {
fprintf(stderr, "mdbx_open failed, error %d %s\n", rc, mdbx_strerror(rc)); fprintf(stderr, "mdbx_open failed, error %d %s\n", rc, mdbx_strerror(rc));
goto txn_abort; goto txn_abort;
@ -450,11 +465,15 @@ int main(int argc, char *argv[]) {
goto txn_abort; goto txn_abort;
} }
int batch = 0;
prevk.iov_len = 0;
while (1) { while (1) {
MDBX_val key;
rc = readline(&key, &kbuf); rc = readline(&key, &kbuf);
if (rc) /* rc == EOF */ if (rc) /* rc == EOF */
break; break;
MDBX_val data;
rc = readline(&data, &dbuf); rc = readline(&data, &dbuf);
if (rc) { if (rc) {
fprintf(stderr, "%s: line %" PRIiSIZE ": failed to read key value\n", fprintf(stderr, "%s: line %" PRIiSIZE ": failed to read key value\n",
@ -462,7 +481,18 @@ int main(int argc, char *argv[]) {
goto txn_abort; goto txn_abort;
} }
rc = mdbx_cursor_put(mc, &key, &data, putflags); int appflag = 0;
if (append) {
appflag = MDBX_APPEND;
if (dbi_flags & MDBX_DUPSORT) {
if (prevk.iov_len == key.iov_len &&
memcmp(prevk.iov_base, key.iov_base, key.iov_len) == 0)
appflag = MDBX_CURRENT | MDBX_APPENDDUP;
else
memcpy(prevk.iov_base, key.iov_base, prevk.iov_len = key.iov_len);
}
}
rc = mdbx_cursor_put(mc, &key, &data, putflags | appflag);
if (rc == MDBX_KEYEXIST && putflags) if (rc == MDBX_KEYEXIST && putflags)
continue; continue;
if (rc) { if (rc) {
@ -501,6 +531,8 @@ int main(int argc, char *argv[]) {
goto env_close; goto env_close;
} }
mdbx_dbi_close(env, dbi); mdbx_dbi_close(env, dbi);
/* try read next header */
if (!(mode & NOHDR)) if (!(mode & NOHDR))
readhdr(); readhdr();
} }