Summary: Hack up rocksdb_dump and rocksdb_undump utilities to get this task rolling/promote discussion. Test Plan: Dump/undump databases recursively to see if nothing is lost. Reviewers: sdong, yhchiang, rven, anthony, kradhakrishnan, igor Reviewed By: igor Subscribers: dhruba Differential Revision: https://reviews.facebook.net/D37269main
parent
04251e1e3a
commit
15325bf55b
@ -0,0 +1,16 @@ |
||||
## RocksDB dump format |
||||
|
||||
The version 1 RocksDB dump format is fairly simple: |
||||
|
||||
1) The dump starts with the magic 8 byte identifier "ROCKDUMP" |
||||
|
||||
2) The magic is followed by an 8 byte big-endian version number, which is 0x0000000000000001 for this format.
||||
|
||||
3) Next come arbitrarily sized chunks of bytes, each prefixed by a 4 byte little-endian number indicating how large the chunk is.
||||
|
||||
4) The first chunk is special and is a JSON string describing the creation of this dump. It is either the empty object `{}` (when the dump was created with `--anonymous`) or contains the following keys:
||||
* database-path: The path of the database this dump was created from. |
||||
* hostname: The hostname of the machine where the dump was created. |
||||
* creation-time: Unix seconds since the epoch when this dump was created.
||||
|
||||
5) Following the info chunk, the remaining chunks are paired up as key/value pairs: each key chunk is immediately followed by its value chunk.
@ -0,0 +1,149 @@ |
||||
// Copyright (c) 2014, Facebook, Inc. All rights reserved.
|
||||
// This source code is licensed under the BSD-style license found in the
|
||||
// LICENSE file in the root directory of this source tree. An additional grant
|
||||
// of patent rights can be found in the PATENTS file in the same directory.
|
||||
|
||||
#ifndef GFLAGS |
||||
#include <cstdio> |
||||
// Fallback entry point used when the tool is built without gflags: it cannot
// parse its command line, so it only reports the missing dependency and fails.
int main() {
  fputs("Please install gflags to run rocksdb tools\n", stderr);
  return 1;
}
||||
#else |
||||
|
||||
#include <gflags/gflags.h> |
||||
#include <iostream> |
||||
|
||||
#include "rocksdb/db.h" |
||||
#include "rocksdb/env.h" |
||||
#include "util/coding.h" |
||||
|
||||
DEFINE_bool(anonymous, false, "Output an empty information blob."); |
||||
|
||||
// Writes the one-line command synopsis for the dump tool to standard output.
// `name` is the program name to show (callers pass argv[0]).
void usage(const char* name) {
  std::cout << "usage: ";
  std::cout << name;
  std::cout << " [--anonymous] <db> <dumpfile>";
  std::cout << std::endl;
}
||||
|
||||
int main(int argc, char** argv) { |
||||
rocksdb::DB* dbptr; |
||||
rocksdb::Options options; |
||||
rocksdb::Status status; |
||||
std::unique_ptr<rocksdb::WritableFile> dumpfile; |
||||
char hostname[1024]; |
||||
int64_t timesec; |
||||
std::string abspath; |
||||
char json[4096]; |
||||
|
||||
GFLAGS::ParseCommandLineFlags(&argc, &argv, true); |
||||
|
||||
static const char* magicstr = "ROCKDUMP"; |
||||
static const char versionstr[8] = {0, 0, 0, 0, 0, 0, 0, 1}; |
||||
|
||||
if (argc != 3) { |
||||
usage(argv[0]); |
||||
exit(1); |
||||
} |
||||
|
||||
rocksdb::Env* env = rocksdb::Env::Default(); |
||||
|
||||
// Open the database
|
||||
options.create_if_missing = false; |
||||
status = rocksdb::DB::OpenForReadOnly(options, argv[1], &dbptr); |
||||
if (!status.ok()) { |
||||
std::cerr << "Unable to open database '" << argv[1] |
||||
<< "' for reading: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
const std::unique_ptr<rocksdb::DB> db(dbptr); |
||||
|
||||
status = env->NewWritableFile(argv[2], &dumpfile, rocksdb::EnvOptions()); |
||||
if (!status.ok()) { |
||||
std::cerr << "Unable to open dump file '" << argv[2] |
||||
<< "' for writing: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
rocksdb::Slice magicslice(magicstr, 8); |
||||
status = dumpfile->Append(magicslice); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
rocksdb::Slice versionslice(versionstr, 8); |
||||
status = dumpfile->Append(versionslice); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
if (FLAGS_anonymous) { |
||||
snprintf(json, sizeof(json), "{}"); |
||||
} else { |
||||
status = env->GetHostName(hostname, sizeof(hostname)); |
||||
status = env->GetCurrentTime(×ec); |
||||
status = env->GetAbsolutePath(argv[1], &abspath); |
||||
snprintf(json, sizeof(json), |
||||
"{ \"database-path\": \"%s\", \"hostname\": \"%s\", " |
||||
"\"creation-time\": %ld }", |
||||
abspath.c_str(), hostname, timesec); |
||||
} |
||||
|
||||
rocksdb::Slice infoslice(json, strlen(json)); |
||||
char infosize[4]; |
||||
rocksdb::EncodeFixed32(infosize, (uint32_t)infoslice.size()); |
||||
rocksdb::Slice infosizeslice(infosize, 4); |
||||
status = dumpfile->Append(infosizeslice); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
status = dumpfile->Append(infoslice); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
const std::unique_ptr<rocksdb::Iterator> it( |
||||
db->NewIterator(rocksdb::ReadOptions())); |
||||
for (it->SeekToFirst(); it->Valid(); it->Next()) { |
||||
char keysize[4]; |
||||
rocksdb::EncodeFixed32(keysize, (uint32_t)it->key().size()); |
||||
rocksdb::Slice keysizeslice(keysize, 4); |
||||
status = dumpfile->Append(keysizeslice); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
status = dumpfile->Append(it->key()); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
char valsize[4]; |
||||
rocksdb::EncodeFixed32(valsize, (uint32_t)it->value().size()); |
||||
rocksdb::Slice valsizeslice(valsize, 4); |
||||
status = dumpfile->Append(valsizeslice); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
status = dumpfile->Append(it->value()); |
||||
if (!status.ok()) { |
||||
std::cerr << "Append failed: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
} |
||||
if (!it->status().ok()) { |
||||
std::cerr << "Database iteration failed: " << status.ToString() |
||||
<< std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
return 0; |
||||
} |
||||
|
||||
#endif // GFLAGS
|
@ -0,0 +1,136 @@ |
||||
// Copyright (c) 2014, Facebook, Inc. All rights reserved.
|
||||
// This source code is licensed under the BSD-style license found in the
|
||||
// LICENSE file in the root directory of this source tree. An additional grant
|
||||
// of patent rights can be found in the PATENTS file in the same directory.
|
||||
|
||||
#include <cstring> |
||||
#include <iostream> |
||||
|
||||
#include "rocksdb/db.h" |
||||
#include "rocksdb/env.h" |
||||
#include "util/coding.h" |
||||
|
||||
// Writes the one-line command synopsis for the undump tool to standard
// output. `name` is the program name to show (callers pass argv[0]).
void usage(const char *name) {
  std::ostream &out = std::cout;
  out << "usage: " << name;
  out << " <dumpfile> <rocksdb>";
  out << std::endl;
}
||||
|
||||
int main(int argc, char **argv) { |
||||
rocksdb::DB *dbptr; |
||||
rocksdb::Options options; |
||||
rocksdb::Status status; |
||||
rocksdb::Env *env; |
||||
std::unique_ptr<rocksdb::SequentialFile> dumpfile; |
||||
rocksdb::Slice slice; |
||||
char scratch8[8]; |
||||
|
||||
static const char *magicstr = "ROCKDUMP"; |
||||
static const char versionstr[8] = {0, 0, 0, 0, 0, 0, 0, 1}; |
||||
|
||||
if (argc != 3) { |
||||
usage(argv[0]); |
||||
exit(1); |
||||
} |
||||
|
||||
env = rocksdb::Env::Default(); |
||||
|
||||
status = env->NewSequentialFile(argv[1], &dumpfile, rocksdb::EnvOptions()); |
||||
if (!status.ok()) { |
||||
std::cerr << "Unable to open dump file '" << argv[1] |
||||
<< "' for reading: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
status = dumpfile->Read(8, &slice, scratch8); |
||||
if (!status.ok() || slice.size() != 8 || |
||||
memcmp(slice.data(), magicstr, 8) != 0) { |
||||
std::cerr << "File '" << argv[1] << "' is not a recognizable dump file." |
||||
<< std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
status = dumpfile->Read(8, &slice, scratch8); |
||||
if (!status.ok() || slice.size() != 8 || |
||||
memcmp(slice.data(), versionstr, 8) != 0) { |
||||
std::cerr << "File '" << argv[1] << "' version not recognized." |
||||
<< std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
status = dumpfile->Read(4, &slice, scratch8); |
||||
if (!status.ok() || slice.size() != 4) { |
||||
std::cerr << "Unable to read info blob size." << std::endl; |
||||
exit(1); |
||||
} |
||||
uint32_t infosize = rocksdb::DecodeFixed32(slice.data()); |
||||
status = dumpfile->Skip(infosize); |
||||
if (!status.ok()) { |
||||
std::cerr << "Unable to skip info blob: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
options.create_if_missing = true; |
||||
status = rocksdb::DB::Open(options, argv[2], &dbptr); |
||||
if (!status.ok()) { |
||||
std::cerr << "Unable to open database '" << argv[2] |
||||
<< "' for writing: " << status.ToString() << std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
const std::unique_ptr<rocksdb::DB> db(dbptr); |
||||
|
||||
uint32_t last_keysize = 64; |
||||
size_t last_valsize = 1 << 20; |
||||
std::unique_ptr<char[]> keyscratch(new char[last_keysize]); |
||||
std::unique_ptr<char[]> valscratch(new char[last_valsize]); |
||||
|
||||
while (1) { |
||||
uint32_t keysize, valsize; |
||||
rocksdb::Slice keyslice; |
||||
rocksdb::Slice valslice; |
||||
|
||||
status = dumpfile->Read(4, &slice, scratch8); |
||||
if (!status.ok() || slice.size() != 4) break; |
||||
keysize = rocksdb::DecodeFixed32(slice.data()); |
||||
if (keysize > last_keysize) { |
||||
while (keysize > last_keysize) last_keysize *= 2; |
||||
keyscratch = std::unique_ptr<char[]>(new char[last_keysize]); |
||||
} |
||||
|
||||
status = dumpfile->Read(keysize, &keyslice, keyscratch.get()); |
||||
if (!status.ok() || keyslice.size() != keysize) { |
||||
std::cerr << "Key read failure: " |
||||
<< (status.ok() ? "insufficient data" : status.ToString()) |
||||
<< std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
status = dumpfile->Read(4, &slice, scratch8); |
||||
if (!status.ok() || slice.size() != 4) { |
||||
std::cerr << "Unable to read value size: " |
||||
<< (status.ok() ? "insufficient data" : status.ToString()) |
||||
<< std::endl; |
||||
exit(1); |
||||
} |
||||
valsize = rocksdb::DecodeFixed32(slice.data()); |
||||
if (valsize > last_valsize) { |
||||
while (valsize > last_valsize) last_valsize *= 2; |
||||
valscratch = std::unique_ptr<char[]>(new char[last_valsize]); |
||||
} |
||||
|
||||
status = dumpfile->Read(valsize, &valslice, valscratch.get()); |
||||
if (!status.ok() || valslice.size() != valsize) { |
||||
std::cerr << "Unable to read value: " |
||||
<< (status.ok() ? "insufficient data" : status.ToString()) |
||||
<< std::endl; |
||||
exit(1); |
||||
} |
||||
|
||||
status = db->Put(rocksdb::WriteOptions(), keyslice, valslice); |
||||
if (!status.ok()) { |
||||
fprintf(stderr, "Unable to write database entry\n"); |
||||
exit(1); |
||||
} |
||||
} |
||||
|
||||
return 0; |
||||
} |
@ -0,0 +1,7 @@ |
||||
# Round-trip test for the dump tools: load the checked-in sample dump into a
# scratch database, dump that database again, and require the new dump to be
# byte-identical to the sample. The script's exit status is non-zero if any
# step fails.

# Stop at the first failing command instead of comparing against a dump that
# was never (or only partially) produced.
set -e

TESTDIR=$(mktemp -d /tmp/rocksdb-dump-test.XXXXX)
DUMPFILE="tools/sample-dump.dmp"

# Remove the scratch directory however the script exits.
trap 'rm -rf "$TESTDIR"' EXIT

# Verify that the sample dump file is undumpable and then redumpable.
./rocksdb_undump "$DUMPFILE" "$TESTDIR/db"
./rocksdb_dump --anonymous "$TESTDIR/db" "$TESTDIR/dump"
cmp "$DUMPFILE" "$TESTDIR/dump"
Binary file not shown.
Loading…
Reference in new issue