mirror of https://github.com/facebook/rocksdb.git
BlobStore Benchmark
Summary: Finally, arc diff works again! This has been sitting in my repo for a while. I would like some comments on my BlobStore benchmark. We don't have to check this in. Also, I don't do any fsync in the BlobStore, so this is all extremely fast. I'm not sure what durability guarantees we need from the BlobStore. Test Plan: Nope Reviewers: dhruba, haobo, kailiu, emayanke Reviewed By: dhruba CC: leveldb Differential Revision: https://reviews.facebook.net/D13527
This commit is contained in:
parent
cb8a7302e4
commit
7e2c1ba173
|
@ -9,9 +9,8 @@ build_config.mk
|
||||||
*.so
|
*.so
|
||||||
*.so.*
|
*.so.*
|
||||||
*_test
|
*_test
|
||||||
db_bench
|
*_bench
|
||||||
db_repl_stress
|
*_stress
|
||||||
db_stress
|
|
||||||
ldb
|
ldb
|
||||||
leveldb_server
|
leveldb_server
|
||||||
leveldb_shell
|
leveldb_shell
|
||||||
|
|
6
Makefile
6
Makefile
|
@ -72,7 +72,8 @@ TOOLS = \
|
||||||
sst_dump \
|
sst_dump \
|
||||||
db_stress \
|
db_stress \
|
||||||
ldb \
|
ldb \
|
||||||
db_repl_stress
|
db_repl_stress \
|
||||||
|
blob_store_bench
|
||||||
|
|
||||||
PROGRAMS = db_bench signal_test $(TESTS) $(TOOLS)
|
PROGRAMS = db_bench signal_test $(TESTS) $(TOOLS)
|
||||||
BENCHMARKS = db_bench_sqlite3 db_bench_tree_db
|
BENCHMARKS = db_bench_sqlite3 db_bench_tree_db
|
||||||
|
@ -183,6 +184,9 @@ db_stress: tools/db_stress.o $(LIBOBJECTS) $(TESTUTIL)
|
||||||
db_repl_stress: tools/db_repl_stress.o $(LIBOBJECTS) $(TESTUTIL)
|
db_repl_stress: tools/db_repl_stress.o $(LIBOBJECTS) $(TESTUTIL)
|
||||||
$(CXX) tools/db_repl_stress.o $(LIBOBJECTS) $(TESTUTIL) $(EXEC_LDFLAGS) -o $@ $(LDFLAGS) $(COVERAGEFLAGS)
|
$(CXX) tools/db_repl_stress.o $(LIBOBJECTS) $(TESTUTIL) $(EXEC_LDFLAGS) -o $@ $(LDFLAGS) $(COVERAGEFLAGS)
|
||||||
|
|
||||||
|
blob_store_bench: tools/blob_store_bench.o $(LIBOBJECTS) $(TESTUTIL)
|
||||||
|
$(CXX) tools/blob_store_bench.o $(LIBOBJECTS) $(TESTUTIL) $(EXEC_LDFLAGS) -o $@ $(LDFLAGS) $(COVERAGEFLAGS)
|
||||||
|
|
||||||
db_bench_sqlite3: doc/bench/db_bench_sqlite3.o $(LIBOBJECTS) $(TESTUTIL)
|
db_bench_sqlite3: doc/bench/db_bench_sqlite3.o $(LIBOBJECTS) $(TESTUTIL)
|
||||||
$(CXX) doc/bench/db_bench_sqlite3.o $(LIBOBJECTS) $(TESTUTIL) $(EXEC_LDFLAGS) -o $@ $(LDFLAGS) -lsqlite3 $(COVERAGEFLAGS)
|
$(CXX) doc/bench/db_bench_sqlite3.o $(LIBOBJECTS) $(TESTUTIL) $(EXEC_LDFLAGS) -o $@ $(LDFLAGS) -lsqlite3 $(COVERAGEFLAGS)
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,259 @@
|
||||||
|
#include <cstdio>
|
||||||
|
#include <vector>
|
||||||
|
#include <atomic>
|
||||||
|
|
||||||
|
#include "rocksdb/env.h"
|
||||||
|
#include "util/blob_store.h"
|
||||||
|
#include "util/testutil.h"
|
||||||
|
|
||||||
|
#define KB 1024LL
|
||||||
|
#define MB 1024*1024LL
|
||||||
|
|
||||||
|
using namespace rocksdb;
|
||||||
|
using namespace std;
|
||||||
|
|
||||||
|
// used by all threads
|
||||||
|
uint64_t timeout_sec;
|
||||||
|
Env *env;
|
||||||
|
BlobStore* bs;
|
||||||
|
|
||||||
|
static std::string RandomString(Random* rnd, uint64_t len) {
|
||||||
|
std::string r;
|
||||||
|
test::RandomString(rnd, len, &r);
|
||||||
|
return r;
|
||||||
|
}
|
||||||
|
|
||||||
|
struct Result {
|
||||||
|
uint32_t writes;
|
||||||
|
uint32_t reads;
|
||||||
|
uint32_t deletes;
|
||||||
|
uint64_t data_written;
|
||||||
|
uint64_t data_read;
|
||||||
|
|
||||||
|
void print() {
|
||||||
|
printf("Total writes = %u\n", writes);
|
||||||
|
printf("Total reads = %u\n", reads);
|
||||||
|
printf("Total deletes = %u\n", deletes);
|
||||||
|
printf("Write throughput = %lf MB/s\n",
|
||||||
|
(double)data_written / (1024*1024.0) / timeout_sec);
|
||||||
|
printf("Read throughput = %lf MB/s\n",
|
||||||
|
(double)data_read / (1024*1024.0) / timeout_sec);
|
||||||
|
printf("Total throughput = %lf MB/s\n",
|
||||||
|
(double)(data_read + data_written) / (1024*1024.0) / timeout_sec);
|
||||||
|
}
|
||||||
|
|
||||||
|
Result() {
|
||||||
|
writes = reads = deletes = data_read = data_written = 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
Result (uint32_t writes, uint32_t reads, uint32_t deletes,
|
||||||
|
uint64_t data_written, uint64_t data_read) :
|
||||||
|
writes(writes), reads(reads), deletes(deletes),
|
||||||
|
data_written(data_written), data_read(data_read) {}
|
||||||
|
|
||||||
|
};
|
||||||
|
|
||||||
|
Result operator + (const Result &a, const Result &b) {
|
||||||
|
return Result(a.writes + b.writes, a.reads + b.reads,
|
||||||
|
a.deletes + b.deletes, a.data_written + b.data_written,
|
||||||
|
a.data_read + b.data_read);
|
||||||
|
}
|
||||||
|
|
||||||
|
struct WorkerThread {
|
||||||
|
uint64_t data_size_from, data_size_to;
|
||||||
|
double read_ratio;
|
||||||
|
uint64_t working_set_size; // start deleting once you reach this
|
||||||
|
Result result;
|
||||||
|
atomic<bool> stopped;
|
||||||
|
|
||||||
|
WorkerThread(uint64_t data_size_from, uint64_t data_size_to,
|
||||||
|
double read_ratio, uint64_t working_set_size) :
|
||||||
|
data_size_from(data_size_from), data_size_to(data_size_to),
|
||||||
|
read_ratio(read_ratio), working_set_size(working_set_size),
|
||||||
|
stopped(false) {}
|
||||||
|
|
||||||
|
WorkerThread(const WorkerThread& wt) :
|
||||||
|
data_size_from(wt.data_size_from), data_size_to(wt.data_size_to),
|
||||||
|
read_ratio(wt.read_ratio), working_set_size(wt.working_set_size),
|
||||||
|
stopped(false) {}
|
||||||
|
};
|
||||||
|
|
||||||
|
static void WorkerThreadBody(void* arg) {
|
||||||
|
WorkerThread* t = reinterpret_cast<WorkerThread*>(arg);
|
||||||
|
Random rnd(5);
|
||||||
|
string buf;
|
||||||
|
vector<pair<Blob, uint64_t>> blobs;
|
||||||
|
vector<string> random_strings;
|
||||||
|
|
||||||
|
for (int i = 0; i < 10; ++i) {
|
||||||
|
random_strings.push_back(RandomString(&rnd, t->data_size_to));
|
||||||
|
}
|
||||||
|
|
||||||
|
uint64_t total_size = 0;
|
||||||
|
|
||||||
|
uint64_t start_micros = env->NowMicros();
|
||||||
|
while (env->NowMicros() - start_micros < timeout_sec * 1000 * 1000) {
|
||||||
|
if (blobs.size() && rand() < RAND_MAX * t->read_ratio) {
|
||||||
|
// read
|
||||||
|
int bi = rand() % blobs.size();
|
||||||
|
Status s = bs->Get(blobs[bi].first, &buf);
|
||||||
|
assert(s.ok());
|
||||||
|
t->result.data_read += buf.size();
|
||||||
|
t->result.reads++;
|
||||||
|
} else {
|
||||||
|
// write
|
||||||
|
uint64_t size = rand() % (t->data_size_to - t->data_size_from) +
|
||||||
|
t->data_size_from;
|
||||||
|
total_size += size;
|
||||||
|
string put_str = random_strings[rand() % random_strings.size()];
|
||||||
|
blobs.push_back(make_pair(Blob(), size));
|
||||||
|
Status s = bs->Put(Slice(put_str.data(), size), &blobs.back().first);
|
||||||
|
assert(s.ok());
|
||||||
|
t->result.data_written += size;
|
||||||
|
t->result.writes++;
|
||||||
|
}
|
||||||
|
|
||||||
|
while (total_size >= t->working_set_size) {
|
||||||
|
// delete random
|
||||||
|
int bi = rand() % blobs.size();
|
||||||
|
total_size -= blobs[bi].second;
|
||||||
|
bs->Delete(blobs[bi].first);
|
||||||
|
blobs.erase(blobs.begin() + bi);
|
||||||
|
t->result.deletes++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
t->stopped.store(true);
|
||||||
|
}
|
||||||
|
|
||||||
|
Result StartBenchmark(vector<WorkerThread>& config) {
|
||||||
|
for (auto w : config) {
|
||||||
|
env->StartThread(WorkerThreadBody, &w);
|
||||||
|
}
|
||||||
|
|
||||||
|
Result result;
|
||||||
|
|
||||||
|
for (auto w : config) {
|
||||||
|
while (!w.stopped.load());
|
||||||
|
result = result + w.result;
|
||||||
|
}
|
||||||
|
|
||||||
|
delete bs;
|
||||||
|
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
|
vector<WorkerThread> SetupBenchmarkBalanced() {
|
||||||
|
string test_path;
|
||||||
|
env->GetTestDirectory(&test_path);
|
||||||
|
test_path.append("/blob_store");
|
||||||
|
|
||||||
|
// config start
|
||||||
|
uint32_t block_size = 16*KB;
|
||||||
|
uint32_t file_size = 1*MB;
|
||||||
|
double read_write_ratio = 0.5;
|
||||||
|
uint64_t data_read_from = 16*KB;
|
||||||
|
uint64_t data_read_to = 32*KB;
|
||||||
|
int number_of_threads = 10;
|
||||||
|
uint64_t working_set_size = 5*MB;
|
||||||
|
timeout_sec = 5;
|
||||||
|
// config end
|
||||||
|
|
||||||
|
bs = new BlobStore(test_path, block_size, file_size / block_size, 10000, env);
|
||||||
|
|
||||||
|
vector <WorkerThread> config;
|
||||||
|
|
||||||
|
for (int i = 0; i < number_of_threads; ++i) {
|
||||||
|
config.push_back(WorkerThread(data_read_from,
|
||||||
|
data_read_to,
|
||||||
|
read_write_ratio,
|
||||||
|
working_set_size));
|
||||||
|
};
|
||||||
|
|
||||||
|
return config;
|
||||||
|
}
|
||||||
|
|
||||||
|
vector<WorkerThread> SetupBenchmarkWriteHeavy() {
|
||||||
|
string test_path;
|
||||||
|
env->GetTestDirectory(&test_path);
|
||||||
|
test_path.append("/blob_store");
|
||||||
|
|
||||||
|
// config start
|
||||||
|
uint32_t block_size = 16*KB;
|
||||||
|
uint32_t file_size = 1*MB;
|
||||||
|
double read_write_ratio = 0.1;
|
||||||
|
uint64_t data_read_from = 16*KB;
|
||||||
|
uint64_t data_read_to = 32*KB;
|
||||||
|
int number_of_threads = 10;
|
||||||
|
uint64_t working_set_size = 5*MB;
|
||||||
|
timeout_sec = 5;
|
||||||
|
// config end
|
||||||
|
|
||||||
|
bs = new BlobStore(test_path, block_size, file_size / block_size, 10000, env);
|
||||||
|
|
||||||
|
vector <WorkerThread> config;
|
||||||
|
|
||||||
|
for (int i = 0; i < number_of_threads; ++i) {
|
||||||
|
config.push_back(WorkerThread(data_read_from,
|
||||||
|
data_read_to,
|
||||||
|
read_write_ratio,
|
||||||
|
working_set_size));
|
||||||
|
};
|
||||||
|
|
||||||
|
return config;
|
||||||
|
}
|
||||||
|
|
||||||
|
vector<WorkerThread> SetupBenchmarkReadHeavy() {
|
||||||
|
string test_path;
|
||||||
|
env->GetTestDirectory(&test_path);
|
||||||
|
test_path.append("/blob_store");
|
||||||
|
|
||||||
|
// config start
|
||||||
|
uint32_t block_size = 16*KB;
|
||||||
|
uint32_t file_size = 1*MB;
|
||||||
|
double read_write_ratio = 0.9;
|
||||||
|
uint64_t data_read_from = 16*KB;
|
||||||
|
uint64_t data_read_to = 32*KB;
|
||||||
|
int number_of_threads = 10;
|
||||||
|
uint64_t working_set_size = 5*MB;
|
||||||
|
timeout_sec = 5;
|
||||||
|
// config end
|
||||||
|
|
||||||
|
bs = new BlobStore(test_path, block_size, file_size / block_size, 10000, env);
|
||||||
|
|
||||||
|
vector <WorkerThread> config;
|
||||||
|
|
||||||
|
for (int i = 0; i < number_of_threads; ++i) {
|
||||||
|
config.push_back(WorkerThread(data_read_from,
|
||||||
|
data_read_to,
|
||||||
|
read_write_ratio,
|
||||||
|
working_set_size));
|
||||||
|
};
|
||||||
|
|
||||||
|
return config;
|
||||||
|
}
|
||||||
|
|
||||||
|
int main(int argc, const char** argv) {
|
||||||
|
srand(33);
|
||||||
|
env = Env::Default();
|
||||||
|
|
||||||
|
{
|
||||||
|
printf("--- Balanced read/write benchmark ---\n");
|
||||||
|
vector <WorkerThread> config = SetupBenchmarkBalanced();
|
||||||
|
Result r = StartBenchmark(config);
|
||||||
|
r.print();
|
||||||
|
}
|
||||||
|
{
|
||||||
|
printf("--- Write heavy benchmark ---\n");
|
||||||
|
vector <WorkerThread> config = SetupBenchmarkWriteHeavy();
|
||||||
|
Result r = StartBenchmark(config);
|
||||||
|
r.print();
|
||||||
|
}
|
||||||
|
{
|
||||||
|
printf("--- Read heavy benchmark ---\n");
|
||||||
|
vector <WorkerThread> config = SetupBenchmarkReadHeavy();
|
||||||
|
Result r = StartBenchmark(config);
|
||||||
|
r.print();
|
||||||
|
}
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
}
|
Loading…
Reference in New Issue