mirror of
https://github.com/facebook/rocksdb.git
synced 2024-11-27 11:43:49 +00:00
768edfaaed
Summary: Added the following two options: [--bloom_bits=<int,e.g.:14>] [--compression_type=<no|snappy|zlib|bzip2>] These options will be used when ldb opens the leveldb database. Test Plan: Tried by hand for both success and failure cases. We do need a test framework. Reviewers: dhruba, emayanke, sheki Reviewed By: dhruba CC: leveldb Differential Revision: https://reviews.facebook.net/D7197
472 lines
14 KiB
C++
472 lines
14 KiB
C++
// Copyright (c) 2012 Facebook. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
// found in the LICENSE file.
|
|
|
|
|
|
#include "leveldb/write_batch.h"
|
|
#include "db/dbformat.h"
|
|
#include "db/log_reader.h"
|
|
#include "db/write_batch_internal.h"
|
|
#include "util/ldb_cmd.h"
|
|
|
|
namespace leveldb {
|
|
|
|
// Prefixes of the switches that influence how the database is opened.
// Arguments starting with either prefix are collected by parse_open_args()
// and interpreted by PrepareOptionsForOpenDB().
const char* LDBCommand::BLOOM_ARG = "--bloom_bits=";
const char* LDBCommand::COMPRESSION_TYPE_ARG = "--compression_type=";
|
|
|
|
void LDBCommand::parse_open_args(std::vector<std::string>& args) {
|
|
std::vector<std::string> rest_of_args;
|
|
for (unsigned int i = 0; i < args.size(); i++) {
|
|
std::string& arg = args.at(i);
|
|
if (arg.find(BLOOM_ARG) == 0
|
|
|| arg.find(COMPRESSION_TYPE_ARG) == 0) {
|
|
open_args_.push_back(arg);
|
|
} else {
|
|
rest_of_args.push_back(arg);
|
|
}
|
|
}
|
|
swap(args, rest_of_args);
|
|
}
|
|
|
|
// Builds the Options used to open the database from the switches captured
// in open_args_.
//
// create_if_missing is always false. A "--bloom_bits=N" switch passes N to
// NewBloomFilterPolicy(); a "--compression_type=no|snappy|zlib|bzip2" switch
// selects the compression type. A value that cannot be used records a
// failure in exec_state_ and leaves the corresponding option untouched.
//
// Returns the populated Options by value.
leveldb::Options LDBCommand::PrepareOptionsForOpenDB() {
  leveldb::Options opt;
  opt.create_if_missing = false;
  for (unsigned int i = 0; i < open_args_.size(); i++) {
    const std::string& arg = open_args_[i];
    if (arg.find(BLOOM_ARG) == 0) {
      const std::string bits_string = arg.substr(strlen(BLOOM_ARG));
      const int bits = atoi(bits_string.c_str());
      if (bits <= 0) {
        // atoi() yields 0 for non-numeric text, and a negative count is just
        // as unusable. Never build a filter from a rejected value.
        exec_state_ = LDBCommandExecuteResult::FAILED(
            std::string("Badly-formatted bits: ") + bits_string);
        continue;
      }
      opt.filter_policy = leveldb::NewBloomFilterPolicy(bits);
    } else if (arg.find(COMPRESSION_TYPE_ARG) == 0) {
      const std::string comp = arg.substr(strlen(COMPRESSION_TYPE_ARG));
      if (comp == "no") {
        opt.compression = leveldb::kNoCompression;
      } else if (comp == "snappy") {
        opt.compression = leveldb::kSnappyCompression;
      } else if (comp == "zlib") {
        opt.compression = leveldb::kZlibCompression;
      } else if (comp == "bzip2") {
        opt.compression = leveldb::kBZip2Compression;
      } else {
        // Unknown compression.
        exec_state_ = LDBCommandExecuteResult::FAILED(
            "Unknown compression level: " + comp);
      }
    }
  }

  return opt;
}
|
|
|
|
|
|
// Switches shared by the commands that operate on a key range:
// "--from=" and "--to=" carry the range bounds, "--hex" marks those bounds
// as hex-encoded.
const char* LDBCommand::FROM_ARG = "--from=";
const char* LDBCommand::END_ARG = "--to=";
const char* LDBCommand::HEX_ARG = "--hex";
|
|
|
|
// Parses the switches of the compaction command.
//
// "--from=" and "--to=" set the respective range bound (a bound that is not
// given stays "null"), "--hex" requests that the given bounds be converted
// with HexToString(). Any other argument marks the command as failed.
Compactor::Compactor(std::string& db_name, std::vector<std::string>& args)
    : LDBCommand(db_name, args),
      null_from_(true),
      null_to_(true),
      hex_(false) {
  for (std::vector<std::string>::iterator it = args.begin();
       it != args.end(); ++it) {
    const std::string& current = *it;
    if (current.find(FROM_ARG) == 0) {
      null_from_ = false;
      from_ = current.substr(strlen(FROM_ARG));
      continue;
    }
    if (current.find(END_ARG) == 0) {
      null_to_ = false;
      to_ = current.substr(strlen(END_ARG));
      continue;
    }
    if (current.find(HEX_ARG) == 0) {
      hex_ = true;
      continue;
    }
    exec_state_ =
        LDBCommandExecuteResult::FAILED("Unknown argument." + current);
  }

  // Decode the bounds only after all switches were seen, so "--hex" may
  // appear anywhere on the command line.
  if (!hex_) {
    return;
  }
  if (!null_from_) {
    from_ = HexToString(from_);
  }
  if (!null_to_) {
    to_ = HexToString(to_);
  }
}
|
|
|
|
// Appends the usage text of the compaction command to `ret`: first the
// text produced by LDBCommand::Help(), then the switches parsed by the
// Compactor constructor.
void Compactor::Help(std::string& ret) {
  LDBCommand::Help(ret);
  ret.append("[--from=START KEY] ");
  // "--to=" is the end of the range, not a second start key.
  ret.append("[--to=END KEY] ");
  ret.append("[--hex] ");
}
|
|
|
|
void Compactor::DoCommand() {
|
|
|
|
leveldb::Slice* begin = NULL;
|
|
leveldb::Slice* end = NULL;
|
|
if (!null_from_) {
|
|
begin = new leveldb::Slice(from_);
|
|
}
|
|
if (!null_to_) {
|
|
end = new leveldb::Slice(to_);
|
|
}
|
|
|
|
db_->CompactRange(begin, end);
|
|
exec_state_ = LDBCommandExecuteResult::SUCCEED("");
|
|
|
|
delete begin;
|
|
delete end;
|
|
}
|
|
|
|
// Switches understood only by the dump command (see the DBDumper
// constructor for how each one is interpreted).
const char* DBDumper::MAX_KEYS_ARG = "--max_keys=";
const char* DBDumper::COUNT_ONLY_ARG = "--count_only";
const char* DBDumper::STATS_ARG = "--stats";
const char* DBDumper::HEX_OUTPUT_ARG = "--output_hex";
|
|
|
|
// Parses the switches of the dump command.
//
// Recognised switches: "--from=" / "--to=" (range bounds), "--hex" (bounds
// are converted with HexToString()), "--max_keys=" (parsed with atoi(),
// default -1), "--stats", "--count_only" and "--output_hex". Any other
// argument marks the command as failed.
DBDumper::DBDumper(std::string& db_name, std::vector<std::string>& args)
    : LDBCommand(db_name, args),
      null_from_(true),
      null_to_(true),
      max_keys_(-1),
      count_only_(false),
      print_stats_(false),
      hex_(false),
      hex_output_(false) {
  for (std::vector<std::string>::iterator it = args.begin();
       it != args.end(); ++it) {
    const std::string& current = *it;
    if (current.find(FROM_ARG) == 0) {
      null_from_ = false;
      from_ = current.substr(strlen(FROM_ARG));
      continue;
    }
    if (current.find(END_ARG) == 0) {
      null_to_ = false;
      to_ = current.substr(strlen(END_ARG));
      continue;
    }
    if (current.find(HEX_ARG) == 0) {
      hex_ = true;
      continue;
    }
    if (current.find(MAX_KEYS_ARG) == 0) {
      const std::string limit = current.substr(strlen(MAX_KEYS_ARG));
      max_keys_ = atoi(limit.c_str());
      continue;
    }
    if (current.find(STATS_ARG) == 0) {
      print_stats_ = true;
      continue;
    }
    if (current.find(COUNT_ONLY_ARG) == 0) {
      count_only_ = true;
      continue;
    }
    if (current.find(HEX_OUTPUT_ARG) == 0) {
      hex_output_ = true;
      continue;
    }
    exec_state_ =
        LDBCommandExecuteResult::FAILED("Unknown argument:" + current);
  }

  // Decode the bounds once every switch has been seen, so the position of
  // "--hex" on the command line does not matter.
  if (!hex_) {
    return;
  }
  if (!null_from_) {
    from_ = HexToString(from_);
  }
  if (!null_to_) {
    to_ = HexToString(to_);
  }
}
|
|
|
|
// Appends the usage text of the dump command to `ret`: the text produced by
// LDBCommand::Help() followed by the dump-specific switches.
void DBDumper::Help(std::string& ret) {
  LDBCommand::Help(ret);
  // Adjacent literals are concatenated by the compiler into one string.
  ret.append(
      "[--from=START KEY] "
      "[--to=END Key] "
      "[--hex] "
      "[--output_hex] "
      "[--max_keys=NUM] "
      "[--count_only] "
      "[--stats] ");
}
|
|
|
|
void DBDumper::DoCommand() {
|
|
if (!db_) {
|
|
return;
|
|
}
|
|
// Parse command line args
|
|
uint64_t count = 0;
|
|
if (print_stats_) {
|
|
std::string stats;
|
|
if (db_->GetProperty("leveldb.stats", &stats)) {
|
|
fprintf(stdout, "%s\n", stats.c_str());
|
|
}
|
|
}
|
|
|
|
// Setup key iterator
|
|
leveldb::Iterator* iter = db_->NewIterator(leveldb::ReadOptions());
|
|
leveldb::Status st = iter->status();
|
|
if (!st.ok()) {
|
|
exec_state_ = LDBCommandExecuteResult::FAILED("Iterator error."
|
|
+ st.ToString());
|
|
}
|
|
|
|
if (!null_from_) {
|
|
iter->Seek(from_);
|
|
} else {
|
|
iter->SeekToFirst();
|
|
}
|
|
|
|
int max_keys = max_keys_;
|
|
for (; iter->Valid(); iter->Next()) {
|
|
// If end marker was specified, we stop before it
|
|
if (!null_to_ && (iter->key().ToString() >= to_))
|
|
break;
|
|
// Terminate if maximum number of keys have been dumped
|
|
if (max_keys == 0)
|
|
break;
|
|
if (max_keys > 0) {
|
|
--max_keys;
|
|
}
|
|
++count;
|
|
if (!count_only_) {
|
|
if (hex_output_) {
|
|
std::string str = iter->key().ToString();
|
|
for (unsigned int i = 0; i < str.length(); ++i) {
|
|
fprintf(stdout, "%X", str[i]);
|
|
}
|
|
fprintf(stdout, " ==> ");
|
|
str = iter->value().ToString();
|
|
for (unsigned int i = 0; i < str.length(); ++i) {
|
|
fprintf(stdout, "%X", str[i]);
|
|
}
|
|
fprintf(stdout, "\n");
|
|
} else {
|
|
fprintf(stdout, "%s ==> %s\n", iter->key().ToString().c_str(),
|
|
iter->value().ToString().c_str());
|
|
}
|
|
}
|
|
}
|
|
fprintf(stdout, "Keys in range: %lld\n", (long long) count);
|
|
// Clean up
|
|
delete iter;
|
|
}
|
|
|
|
|
|
// Switches understood only by the reduce-levels command.
// Note that this command spells its compression switch "--compression=",
// which differs from LDBCommand::COMPRESSION_TYPE_ARG
// ("--compression_type=").
const char* ReduceDBLevels::NEW_LEVLES_ARG = "--new_levels=";
const char* ReduceDBLevels::PRINT_OLD_LEVELS_ARG = "--print_old_levels";
const char* ReduceDBLevels::COMPRESSION_TYPE_ARG = "--compression=";
const char* ReduceDBLevels::FILE_SIZE_ARG = "--file_size=";
|
|
|
|
// Parses the switches of the reduce-levels command.
//
// file_size_ and compression_ start from the defaults of a freshly
// constructed leveldb::Options and may be overridden with "--file_size="
// and "--compression=none|snappy|zlib|bzip2" (matched case-insensitively).
// "--new_levels=" is mandatory: when it is missing or not positive the
// command is marked as failed. Unknown arguments also mark it as failed.
ReduceDBLevels::ReduceDBLevels(std::string& db_name,
                               std::vector<std::string>& args)
    : LDBCommand(db_name, args),
      old_levels_(1 << 16),
      new_levels_(-1),
      print_old_levels_(false) {
  file_size_ = leveldb::Options().target_file_size_base;
  compression_ = leveldb::Options().compression;

  for (unsigned int i = 0; i < args.size(); i++) {
    std::string& arg = args.at(i);
    if (arg.find(NEW_LEVLES_ARG) == 0) {
      new_levels_ = atoi(arg.substr(strlen(NEW_LEVLES_ARG)).c_str());
    } else if (arg.find(PRINT_OLD_LEVELS_ARG) == 0) {
      print_old_levels_ = true;
    } else if (arg.find(COMPRESSION_TYPE_ARG) == 0) {
      // Keep the value in a named string: taking c_str() of the temporary
      // returned by substr() would leave `type` dangling before it is read.
      const std::string type_name = arg.substr(strlen(COMPRESSION_TYPE_ARG));
      const char* type = type_name.c_str();
      if (!strcasecmp(type, "none")) {
        compression_ = leveldb::kNoCompression;
      } else if (!strcasecmp(type, "snappy")) {
        compression_ = leveldb::kSnappyCompression;
      } else if (!strcasecmp(type, "zlib")) {
        compression_ = leveldb::kZlibCompression;
      } else if (!strcasecmp(type, "bzip2")) {
        compression_ = leveldb::kBZip2Compression;
      } else {
        exec_state_ = LDBCommandExecuteResult::FAILED(
            "Invalid compression arg : " + arg);
      }
    } else if (arg.find(FILE_SIZE_ARG) == 0) {
      file_size_ = atoi(arg.substr(strlen(FILE_SIZE_ARG)).c_str());
    } else {
      exec_state_ = LDBCommandExecuteResult::FAILED(
          "Unknown argument." + arg);
    }
  }

  if (new_levels_ <= 0) {
    exec_state_ = LDBCommandExecuteResult::FAILED(
        " Use --new_levels to specify a new level number\n");
  }
}
|
|
|
|
std::vector<std::string> ReduceDBLevels::PrepareArgs(int new_levels,
|
|
bool print_old_level) {
|
|
std::vector<std::string> ret;
|
|
char arg[100];
|
|
sprintf(arg, "%s%d", NEW_LEVLES_ARG, new_levels);
|
|
ret.push_back(arg);
|
|
if(print_old_level) {
|
|
sprintf(arg, "%s", PRINT_OLD_LEVELS_ARG);
|
|
ret.push_back(arg);
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
// Appends the usage text of the reduce-levels command to `msg`: the text
// produced by LDBCommand::Help() followed by the command-specific switches.
void ReduceDBLevels::Help(std::string& msg) {
  LDBCommand::Help(msg);
  // Adjacent literals are concatenated by the compiler into one string.
  msg.append(
      "[--new_levels=New number of levels] "
      "[--print_old_levels] "
      "[--compression=none|snappy|zlib|bzip2] "
      "[--file_size= per-file size] ");
}
|
|
|
|
// Extends the base-class open options for level reduction: the database is
// opened with old_levels_ levels and with level-size limits chosen so that
// size-triggered compaction is effectively disabled.
leveldb::Options ReduceDBLevels::PrepareOptionsForOpenDB() {
  leveldb::Options opt = LDBCommand::PrepareOptionsForOpenDB();
  opt.num_levels = old_levels_;
  // Disable size compaction
  // 1ULL rather than 1UL: unsigned long may be only 32 bits wide, in which
  // case shifting it by 50 is undefined.
  opt.max_bytes_for_level_base = 1ULL << 50;
  opt.max_bytes_for_level_multiplier = 1;
  opt.max_mem_compaction_level = 0;
  return opt;
}
|
|
|
|
// Determines how many levels of the database at db_path_ currently hold
// files.
//
// opt:    options used to construct the TableCache and VersionSet.
// levels: on success receives (index of the highest level that contains at
//         least one file) + 1, i.e. 0 when no level has files. Left
//         untouched on failure.
//
// Returns the status of VersionSet::Recover().
Status ReduceDBLevels::GetOldNumOfLevels(leveldb::Options& opt, int* levels) {
  // NOTE(review): tc and cmp are never deleted here. Whether VersionSet
  // takes ownership of them is not visible in this file -- confirm before
  // adding deletes.
  TableCache* tc = new TableCache(db_path_, &opt, 10);
  const InternalKeyComparator* cmp = new InternalKeyComparator(
      opt.comparator);
  VersionSet* versions = new VersionSet(db_path_, &opt,
                                        tc, cmp);
  // We rely the VersionSet::Recover to tell us the internal data structures
  // in the db. And the Recover() should never do any change
  // (like LogAndApply) to the manifest file.
  Status st = versions->Recover();
  if (st.ok()) {
    int max = -1;
    for (int i = 0; i < versions->NumberLevels(); i++) {
      if (versions->NumLevelFiles(i)) {
        max = i;
      }
    }
    *levels = max + 1;
  }

  // Release the version set on the failure path as well.
  delete versions;
  return st;
}
|
|
|
|
void ReduceDBLevels::DoCommand() {
|
|
if (new_levels_ <= 1) {
|
|
exec_state_ = LDBCommandExecuteResult::FAILED(
|
|
"Invalid number of levels.\n");
|
|
return;
|
|
}
|
|
|
|
leveldb::Status st;
|
|
leveldb::Options opt = PrepareOptionsForOpenDB();
|
|
int old_level_num = -1;
|
|
st = GetOldNumOfLevels(opt, &old_level_num);
|
|
if (!st.ok()) {
|
|
exec_state_ = LDBCommandExecuteResult::FAILED(st.ToString());
|
|
return;
|
|
}
|
|
|
|
if (print_old_levels_) {
|
|
fprintf(stdout, "The old number of levels in use is %d\n", old_level_num);
|
|
}
|
|
|
|
if (old_level_num <= new_levels_) {
|
|
return;
|
|
}
|
|
|
|
old_levels_ = old_level_num;
|
|
|
|
OpenDB();
|
|
if (!db_) {
|
|
return;
|
|
}
|
|
// Compact the whole DB to put all files to the highest level.
|
|
fprintf(stdout, "Compacting the db...\n");
|
|
db_->CompactRange(NULL, NULL);
|
|
CloseDB();
|
|
|
|
TableCache* tc = new TableCache(db_path_, &opt, 10);
|
|
const InternalKeyComparator* cmp = new InternalKeyComparator(
|
|
opt.comparator);
|
|
VersionSet* versions = new VersionSet(db_path_, &opt,
|
|
tc, cmp);
|
|
// We rely the VersionSet::Recover to tell us the internal data structures
|
|
// in the db. And the Recover() should never do any change (like LogAndApply)
|
|
// to the manifest file.
|
|
st = versions->Recover();
|
|
if (!st.ok()) {
|
|
exec_state_ = LDBCommandExecuteResult::FAILED(st.ToString());
|
|
return;
|
|
}
|
|
|
|
port::Mutex mu;
|
|
mu.Lock();
|
|
st = versions->ReduceNumberOfLevels(new_levels_, &mu);
|
|
mu.Unlock();
|
|
|
|
if (!st.ok()) {
|
|
exec_state_ = LDBCommandExecuteResult::FAILED(st.ToString());
|
|
return;
|
|
}
|
|
}
|
|
|
|
// Prefix of the switch that names the write-ahead-log file to dump.
const char* WALDumper::WAL_FILE_ARG = "--walfile=";
|
|
// Parses the switches of the WAL dump command.
//
// "--walfile=" names the log file to dump and is mandatory; "--header"
// requests a header line before the records. Any other argument, or a
// missing/empty "--walfile=", marks the command as failed.
WALDumper::WALDumper(std::vector<std::string>& args)
    : LDBCommand(args),
      print_header_(false) {
  wal_file_.clear();
  for (std::vector<std::string>::iterator it = args.begin();
       it != args.end(); ++it) {
    const std::string& current = *it;
    if (current.find("--header") == 0) {
      print_header_ = true;
      continue;
    }
    if (current.find(WAL_FILE_ARG) == 0) {
      wal_file_ = current.substr(strlen(WAL_FILE_ARG));
      continue;
    }
    exec_state_ =
        LDBCommandExecuteResult::FAILED("Unknown argument " + current);
  }

  const bool have_wal_file = !wal_file_.empty();
  if (!have_wal_file) {
    exec_state_ = LDBCommandExecuteResult::FAILED("Argument --walfile reqd.");
  }
}
|
|
|
|
// Appends the usage text of the WAL dump command to `ret`.
void WALDumper::Help(std::string& ret) {
  // The constructor only recognises the "--walfile=<path>" form, so show the
  // '=' in the usage text.
  ret.append("--walfile=write_ahead_log ");
  ret.append("[--header prints a header] ");
}
|
|
|
|
void WALDumper::DoCommand() {
|
|
struct StdErrReporter : public log::Reader::Reporter {
|
|
virtual void Corruption(size_t bytes, const Status& s) {
|
|
std::cerr<<"Corruption detected in log file "<<s.ToString()<<"\n";
|
|
}
|
|
};
|
|
|
|
SequentialFile* file;
|
|
Env* env_ = Env::Default();
|
|
Status status = env_->NewSequentialFile(wal_file_, &file);
|
|
if (!status.ok()) {
|
|
exec_state_ = LDBCommandExecuteResult::FAILED("Failed to open WAL file " +
|
|
status.ToString());
|
|
} else {
|
|
StdErrReporter reporter;
|
|
log::Reader reader(file, &reporter, true, 0);
|
|
std::string scratch;
|
|
WriteBatch batch;
|
|
Slice record;
|
|
std::stringstream row;
|
|
if (print_header_) {
|
|
std::cout<<"Sequence,Count,ByteSize,Physical Offset\n";
|
|
}
|
|
while(reader.ReadRecord(&record, &scratch)) {
|
|
row.str("");
|
|
if (record.size() < 12) {
|
|
reporter.Corruption(
|
|
record.size(), Status::Corruption("log record too small"));
|
|
} else {
|
|
WriteBatchInternal::SetContents(&batch, record);
|
|
row<<WriteBatchInternal::Sequence(&batch)<<",";
|
|
row<<WriteBatchInternal::Count(&batch)<<",";
|
|
row<<WriteBatchInternal::ByteSize(&batch)<<",";
|
|
row<<reader.LastRecordOffset()<<"\n";
|
|
}
|
|
std::cout<<row.str();
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|