123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496 |
- /* mdb_load.c - memory-mapped database load tool */
- /*
- * Copyright 2011-2021 Howard Chu, Symas Corp.
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted only as authorized by the OpenLDAP
- * Public License.
- *
- * A copy of this license is available in the file LICENSE in the
- * top-level directory of the distribution or, alternatively, at
- * <http://www.OpenLDAP.org/license.html>.
- */
- #include <stdio.h>
- #include <stdlib.h>
- #include <errno.h>
- #include <string.h>
- #include <ctype.h>
- #include <unistd.h>
- #include "lmdb.h"
- #define PRINT 1
- #define NOHDR 2
- static int mode;
- static char *subname = NULL;
- static size_t lineno;
- static int version;
- static int flags;
- static char *prog;
- static int Eof;
- static MDB_envinfo info;
- static MDB_val kbuf, dbuf;
- static MDB_val k0buf;
- #ifdef _WIN32
- #define Z "I"
- #else
- #define Z "z"
- #endif
- #define STRLENOF(s) (sizeof(s)-1)
- typedef struct flagbit {
- int bit;
- char *name;
- int len;
- } flagbit;
- #define S(s) s, STRLENOF(s)
- flagbit dbflags[] = {
- { MDB_REVERSEKEY, S("reversekey") },
- { MDB_DUPSORT, S("dupsort") },
- { MDB_INTEGERKEY, S("integerkey") },
- { MDB_DUPFIXED, S("dupfixed") },
- { MDB_INTEGERDUP, S("integerdup") },
- { MDB_REVERSEDUP, S("reversedup") },
- { 0, NULL, 0 }
- };
- static void readhdr(void)
- {
- char *ptr;
- flags = 0;
- while (fgets(dbuf.mv_data, dbuf.mv_size, stdin) != NULL) {
- lineno++;
- if (!strncmp(dbuf.mv_data, "VERSION=", STRLENOF("VERSION="))) {
- version=atoi((char *)dbuf.mv_data+STRLENOF("VERSION="));
- if (version > 3) {
- fprintf(stderr, "%s: line %" Z "d: unsupported VERSION %d\n",
- prog, lineno, version);
- exit(EXIT_FAILURE);
- }
- } else if (!strncmp(dbuf.mv_data, "HEADER=END", STRLENOF("HEADER=END"))) {
- break;
- } else if (!strncmp(dbuf.mv_data, "format=", STRLENOF("format="))) {
- if (!strncmp((char *)dbuf.mv_data+STRLENOF("FORMAT="), "print", STRLENOF("print")))
- mode |= PRINT;
- else if (strncmp((char *)dbuf.mv_data+STRLENOF("FORMAT="), "bytevalue", STRLENOF("bytevalue"))) {
- fprintf(stderr, "%s: line %" Z "d: unsupported FORMAT %s\n",
- prog, lineno, (char *)dbuf.mv_data+STRLENOF("FORMAT="));
- exit(EXIT_FAILURE);
- }
- } else if (!strncmp(dbuf.mv_data, "database=", STRLENOF("database="))) {
- ptr = memchr(dbuf.mv_data, '\n', dbuf.mv_size);
- if (ptr) *ptr = '\0';
- if (subname) free(subname);
- subname = strdup((char *)dbuf.mv_data+STRLENOF("database="));
- } else if (!strncmp(dbuf.mv_data, "type=", STRLENOF("type="))) {
- if (strncmp((char *)dbuf.mv_data+STRLENOF("type="), "btree", STRLENOF("btree"))) {
- fprintf(stderr, "%s: line %" Z "d: unsupported type %s\n",
- prog, lineno, (char *)dbuf.mv_data+STRLENOF("type="));
- exit(EXIT_FAILURE);
- }
- } else if (!strncmp(dbuf.mv_data, "mapaddr=", STRLENOF("mapaddr="))) {
- int i;
- ptr = memchr(dbuf.mv_data, '\n', dbuf.mv_size);
- if (ptr) *ptr = '\0';
- i = sscanf((char *)dbuf.mv_data+STRLENOF("mapaddr="), "%p", &info.me_mapaddr);
- if (i != 1) {
- fprintf(stderr, "%s: line %" Z "d: invalid mapaddr %s\n",
- prog, lineno, (char *)dbuf.mv_data+STRLENOF("mapaddr="));
- exit(EXIT_FAILURE);
- }
- } else if (!strncmp(dbuf.mv_data, "mapsize=", STRLENOF("mapsize="))) {
- int i;
- ptr = memchr(dbuf.mv_data, '\n', dbuf.mv_size);
- if (ptr) *ptr = '\0';
- i = sscanf((char *)dbuf.mv_data+STRLENOF("mapsize="), "%" Z "u", &info.me_mapsize);
- if (i != 1) {
- fprintf(stderr, "%s: line %" Z "d: invalid mapsize %s\n",
- prog, lineno, (char *)dbuf.mv_data+STRLENOF("mapsize="));
- exit(EXIT_FAILURE);
- }
- } else if (!strncmp(dbuf.mv_data, "maxreaders=", STRLENOF("maxreaders="))) {
- int i;
- ptr = memchr(dbuf.mv_data, '\n', dbuf.mv_size);
- if (ptr) *ptr = '\0';
- i = sscanf((char *)dbuf.mv_data+STRLENOF("maxreaders="), "%u", &info.me_maxreaders);
- if (i != 1) {
- fprintf(stderr, "%s: line %" Z "d: invalid maxreaders %s\n",
- prog, lineno, (char *)dbuf.mv_data+STRLENOF("maxreaders="));
- exit(EXIT_FAILURE);
- }
- } else {
- int i;
- for (i=0; dbflags[i].bit; i++) {
- if (!strncmp(dbuf.mv_data, dbflags[i].name, dbflags[i].len) &&
- ((char *)dbuf.mv_data)[dbflags[i].len] == '=') {
- flags |= dbflags[i].bit;
- break;
- }
- }
- if (!dbflags[i].bit) {
- ptr = memchr(dbuf.mv_data, '=', dbuf.mv_size);
- if (!ptr) {
- fprintf(stderr, "%s: line %" Z "d: unexpected format\n",
- prog, lineno);
- exit(EXIT_FAILURE);
- } else {
- *ptr = '\0';
- fprintf(stderr, "%s: line %" Z "d: unrecognized keyword ignored: %s\n",
- prog, lineno, (char *)dbuf.mv_data);
- }
- }
- }
- }
- }
- static void badend(void)
- {
- fprintf(stderr, "%s: line %" Z "d: unexpected end of input\n",
- prog, lineno);
- }
/*
 * Convert the two hex digits at c2[0] and c2[1] into one byte value.
 * Callers validate the digits with isxdigit() first; no checking is
 * done here.
 */
static int unhex(unsigned char *c2)
{
	int value = 0;
	int i;

	for (i = 0; i < 2; i++) {
		/* Masking with 0x4f folds 'a'-'f' onto 'A'-'F' and reduces
		 * '0'-'9' to 0-9; bit 0x40 then marks a letter digit.
		 */
		int nibble = c2[i] & 0x4f;
		if (nibble & 0x40)
			nibble -= 55;	/* 'A' (65) -> 10 */
		value = (value << 4) | nibble;
	}
	return value;
}
- static int readline(MDB_val *out, MDB_val *buf)
- {
- unsigned char *c1, *c2, *end;
- size_t len, l2;
- int c;
- if (!(mode & NOHDR)) {
- c = fgetc(stdin);
- if (c == EOF) {
- Eof = 1;
- return EOF;
- }
- if (c != ' ') {
- lineno++;
- if (fgets(buf->mv_data, buf->mv_size, stdin) == NULL) {
- badend:
- Eof = 1;
- badend();
- return EOF;
- }
- if (c == 'D' && !strncmp(buf->mv_data, "ATA=END", STRLENOF("ATA=END")))
- return EOF;
- goto badend;
- }
- }
- if (fgets(buf->mv_data, buf->mv_size, stdin) == NULL) {
- Eof = 1;
- return EOF;
- }
- lineno++;
- c1 = buf->mv_data;
- len = strlen((char *)c1);
- l2 = len;
- /* Is buffer too short? */
- while (c1[len-1] != '\n') {
- buf->mv_data = realloc(buf->mv_data, buf->mv_size*2);
- if (!buf->mv_data) {
- Eof = 1;
- fprintf(stderr, "%s: line %" Z "d: out of memory, line too long\n",
- prog, lineno);
- return EOF;
- }
- c1 = buf->mv_data;
- c1 += l2;
- if (fgets((char *)c1, buf->mv_size+1, stdin) == NULL) {
- Eof = 1;
- badend();
- return EOF;
- }
- buf->mv_size *= 2;
- len = strlen((char *)c1);
- l2 += len;
- }
- c1 = c2 = buf->mv_data;
- len = l2;
- c1[--len] = '\0';
- end = c1 + len;
- if (mode & PRINT) {
- while (c2 < end) {
- if (*c2 == '\\') {
- if (c2[1] == '\\') {
- *c1++ = *c2;
- } else {
- if (c2+3 > end || !isxdigit(c2[1]) || !isxdigit(c2[2])) {
- Eof = 1;
- badend();
- return EOF;
- }
- *c1++ = unhex(++c2);
- }
- c2 += 2;
- } else {
- /* copies are redundant when no escapes were used */
- *c1++ = *c2++;
- }
- }
- } else {
- /* odd length not allowed */
- if (len & 1) {
- Eof = 1;
- badend();
- return EOF;
- }
- while (c2 < end) {
- if (!isxdigit(*c2) || !isxdigit(c2[1])) {
- Eof = 1;
- badend();
- return EOF;
- }
- *c1++ = unhex(c2);
- c2 += 2;
- }
- }
- c2 = out->mv_data = buf->mv_data;
- out->mv_size = c1 - c2;
- return 0;
- }
- static void usage(void)
- {
- fprintf(stderr, "usage: %s [-V] [-a] [-f input] [-n] [-s name] [-N] [-T] dbpath\n", prog);
- exit(EXIT_FAILURE);
- }
- static int greater(const MDB_val *a, const MDB_val *b)
- {
- return 1;
- }
- int main(int argc, char *argv[])
- {
- int i, rc;
- MDB_env *env;
- MDB_txn *txn;
- MDB_cursor *mc;
- MDB_dbi dbi;
- char *envname;
- int envflags = MDB_NOSYNC, putflags = 0;
- int dohdr = 0, append = 0;
- MDB_val prevk;
- prog = argv[0];
- if (argc < 2) {
- usage();
- }
- /* -a: append records in input order
- * -f: load file instead of stdin
- * -n: use NOSUBDIR flag on env_open
- * -s: load into named subDB
- * -N: use NOOVERWRITE on puts
- * -T: read plaintext
- * -V: print version and exit
- */
- while ((i = getopt(argc, argv, "af:ns:NTV")) != EOF) {
- switch(i) {
- case 'V':
- printf("%s\n", MDB_VERSION_STRING);
- exit(0);
- break;
- case 'a':
- append = 1;
- break;
- case 'f':
- if (freopen(optarg, "r", stdin) == NULL) {
- fprintf(stderr, "%s: %s: reopen: %s\n",
- prog, optarg, strerror(errno));
- exit(EXIT_FAILURE);
- }
- break;
- case 'n':
- envflags |= MDB_NOSUBDIR;
- break;
- case 's':
- subname = strdup(optarg);
- break;
- case 'N':
- putflags = MDB_NOOVERWRITE|MDB_NODUPDATA;
- break;
- case 'T':
- mode |= NOHDR | PRINT;
- break;
- default:
- usage();
- }
- }
- if (optind != argc - 1)
- usage();
- dbuf.mv_size = 4096;
- dbuf.mv_data = malloc(dbuf.mv_size);
- if (!(mode & NOHDR))
- readhdr();
- envname = argv[optind];
- rc = mdb_env_create(&env);
- if (rc) {
- fprintf(stderr, "mdb_env_create failed, error %d %s\n", rc, mdb_strerror(rc));
- return EXIT_FAILURE;
- }
- mdb_env_set_maxdbs(env, 2);
- if (info.me_maxreaders)
- mdb_env_set_maxreaders(env, info.me_maxreaders);
- if (info.me_mapsize)
- mdb_env_set_mapsize(env, info.me_mapsize);
- if (info.me_mapaddr)
- envflags |= MDB_FIXEDMAP;
- rc = mdb_env_open(env, envname, envflags, 0664);
- if (rc) {
- fprintf(stderr, "mdb_env_open failed, error %d %s\n", rc, mdb_strerror(rc));
- goto env_close;
- }
- kbuf.mv_size = mdb_env_get_maxkeysize(env) * 2 + 2;
- kbuf.mv_data = malloc(kbuf.mv_size * 2);
- k0buf.mv_size = kbuf.mv_size;
- k0buf.mv_data = (char *)kbuf.mv_data + kbuf.mv_size;
- prevk.mv_data = k0buf.mv_data;
- while(!Eof) {
- MDB_val key, data;
- int batch = 0;
- flags = 0;
- int appflag;
- if (!dohdr) {
- dohdr = 1;
- } else if (!(mode & NOHDR))
- readhdr();
-
- rc = mdb_txn_begin(env, NULL, 0, &txn);
- if (rc) {
- fprintf(stderr, "mdb_txn_begin failed, error %d %s\n", rc, mdb_strerror(rc));
- goto env_close;
- }
- rc = mdb_open(txn, subname, flags|MDB_CREATE, &dbi);
- if (rc) {
- fprintf(stderr, "mdb_open failed, error %d %s\n", rc, mdb_strerror(rc));
- goto txn_abort;
- }
- prevk.mv_size = 0;
- if (append) {
- mdb_set_compare(txn, dbi, greater);
- if (flags & MDB_DUPSORT)
- mdb_set_dupsort(txn, dbi, greater);
- }
- rc = mdb_cursor_open(txn, dbi, &mc);
- if (rc) {
- fprintf(stderr, "mdb_cursor_open failed, error %d %s\n", rc, mdb_strerror(rc));
- goto txn_abort;
- }
- while(1) {
- rc = readline(&key, &kbuf);
- if (rc) /* rc == EOF */
- break;
- rc = readline(&data, &dbuf);
- if (rc) {
- fprintf(stderr, "%s: line %" Z "d: failed to read key value\n", prog, lineno);
- goto txn_abort;
- }
- if (append) {
- appflag = MDB_APPEND;
- if (flags & MDB_DUPSORT) {
- if (prevk.mv_size == key.mv_size && !memcmp(prevk.mv_data, key.mv_data, key.mv_size))
- appflag = MDB_CURRENT|MDB_APPENDDUP;
- else {
- memcpy(prevk.mv_data, key.mv_data, key.mv_size);
- prevk.mv_size = key.mv_size;
- }
- }
- } else {
- appflag = 0;
- }
- rc = mdb_cursor_put(mc, &key, &data, putflags|appflag);
- if (rc == MDB_KEYEXIST && putflags)
- continue;
- if (rc) {
- fprintf(stderr, "mdb_cursor_put failed, error %d %s\n", rc, mdb_strerror(rc));
- goto txn_abort;
- }
- batch++;
- if (batch == 100) {
- rc = mdb_txn_commit(txn);
- if (rc) {
- fprintf(stderr, "%s: line %" Z "d: txn_commit: %s\n",
- prog, lineno, mdb_strerror(rc));
- goto env_close;
- }
- rc = mdb_txn_begin(env, NULL, 0, &txn);
- if (rc) {
- fprintf(stderr, "mdb_txn_begin failed, error %d %s\n", rc, mdb_strerror(rc));
- goto env_close;
- }
- rc = mdb_cursor_open(txn, dbi, &mc);
- if (rc) {
- fprintf(stderr, "mdb_cursor_open failed, error %d %s\n", rc, mdb_strerror(rc));
- goto txn_abort;
- }
- if (appflag & MDB_APPENDDUP) {
- MDB_val k, d;
- mdb_cursor_get(mc, &k, &d, MDB_LAST);
- }
- batch = 0;
- }
- }
- rc = mdb_txn_commit(txn);
- txn = NULL;
- if (rc) {
- fprintf(stderr, "%s: line %" Z "d: txn_commit: %s\n",
- prog, lineno, mdb_strerror(rc));
- goto env_close;
- }
- mdb_dbi_close(env, dbi);
- }
- txn_abort:
- mdb_txn_abort(txn);
- env_close:
- mdb_env_close(env);
- return rc ? EXIT_FAILURE : EXIT_SUCCESS;
- }
|