Fix race to make BlockBasedTableOptions effectively mutable (#13082)

Summary:
Fix a longstanding race condition in SetOptions for `block_based_table_factory` options. The fix is mostly described in new, unified `TableFactoryParseFn()` in `cf_options.cc`. Also in this PR:
* Adds a virtual `Clone()` function to TableFactory
* To avoid behavioral hiccups with `SetOptions`, make the "hidden state" of `BlockBasedTableFactory` shared between an original and a clone. For example, `TailPrefetchStats`
* `Configurable` was allowed to be copied but was not safe to do so, because the copy would have and use pointers into object it was copied from (!!!). This has been fixed using relative instead of absolute pointers, though it's still technically relying on undefined behavior (consistent object layout for non-standard-layout types).

For future follow-up:
* Deny SetOptions on block cache options (dubious and not yet made safe with proper shared_ptr handling)

Fixes https://github.com/facebook/rocksdb/issues/10079

Pull Request resolved: https://github.com/facebook/rocksdb/pull/13082

Test Plan:
added to unit tests and crash test

Ran TSAN blackbox crashtest for hours with options to amplify potential race (see https://github.com/facebook/rocksdb/issues/10079)

Reviewed By: cbi42

Differential Revision: D64947243

Pulled By: pdillinger

fbshipit-source-id: 8390299149f50e2a2b39a5247680f2637edb23c8
This commit is contained in:
Peter Dillinger 2024-10-25 10:24:54 -07:00 committed by Facebook GitHub Bot
parent 9c94559de7
commit 3fd1f11d35
20 changed files with 415 additions and 195 deletions

View File

@ -618,8 +618,9 @@ TEST_F(DBBlockCacheTest, DynamicOptions) {
++i;
// NOT YET SUPPORTED
ASSERT_NOK(dbfull()->SetOptions(
{{"block_based_table_factory", "{block_cache=null;}"}}));
// FIXME: find a way to make this fail again (until well supported)
// ASSERT_NOK(dbfull()->SetOptions(
// {{"block_based_table_factory", "{block_cache=null;}"}}));
// ASSERT_OK(Put(std::to_string(i), value));
// ASSERT_OK(Flush());
@ -631,8 +632,11 @@ TEST_F(DBBlockCacheTest, DynamicOptions) {
// ASSERT_EQ(0, st->getAndResetTickerCount(BLOCK_CACHE_DATA_HIT));
// ++i;
ASSERT_NOK(dbfull()->SetOptions(
{{"block_based_table_factory", "{block_cache=1M;}"}}));
// NOT YET SUPPORTED
// FIXME: find a way to make this fail again (until well supported)
// ASSERT_NOK(dbfull()->SetOptions(
// {{"block_based_table_factory", "{block_cache=1M;}"}}));
// ASSERT_OK(Put(std::to_string(i), value));
// ASSERT_OK(Flush());

View File

@ -1975,10 +1975,24 @@ TEST_F(DBBloomFilterTest, MutatingRibbonFilterPolicy) {
if (configs.empty()) {
break;
}
std::string factory_field =
(v[0] & 1) ? "table_factory" : "block_based_table_factory";
// Some irrelevant SetOptions to be sure they don't interfere
ASSERT_OK(db_->SetOptions({{"level0_file_num_compaction_trigger", "10"}}));
ASSERT_OK(
db_->SetOptions({{"table_factory.filter_policy.bloom_before_level",
db_->SetOptions({{"block_based_table_factory", "{block_size=1234}"}}));
ASSERT_OK(db_->SetOptions({{factory_field + ".block_size", "12345"}}));
// Test the mutable field we're interested in
ASSERT_OK(
db_->SetOptions({{factory_field + ".filter_policy.bloom_before_level",
configs.back().first}}));
// FilterPolicy pointer should not have changed
ASSERT_EQ(db_->GetOptions()
.table_factory->GetOptions<BlockBasedTableOptions>()
->filter_policy.get(),
table_options.filter_policy.get());
// Ensure original object is mutated
std::string val;
@ -1991,6 +2005,59 @@ TEST_F(DBBloomFilterTest, MutatingRibbonFilterPolicy) {
}
}
TEST_F(DBBloomFilterTest, MutableFilterPolicy) {
// Test that BlockBasedTableOptions::filter_policy is mutable (replaceable)
// with SetOptions.
Options options = CurrentOptions();
options.statistics = CreateDBStatistics();
auto& stats = *options.statistics;
BlockBasedTableOptions table_options;
// First config, to make sure there's no issues with this shared ptr
// etc. when the DB switches filter policies.
table_options.filter_policy.reset(NewBloomFilterPolicy(10));
double expected_bpk = 10.0;
// Other configs to try
std::vector<std::pair<std::string, double>> configs = {
{"ribbonfilter:10:-1", 7.0}, {"bloomfilter:5", 5.0}, {"nullptr", 0.0}};
table_options.cache_index_and_filter_blocks = true;
options.table_factory.reset(NewBlockBasedTableFactory(table_options));
options.level0_file_num_compaction_trigger =
static_cast<int>(configs.size()) + 2;
ASSERT_OK(TryReopen(options));
char v[] = "a";
for (;; ++(v[0])) {
const int maxKey = 8000;
for (int i = 0; i < maxKey; i++) {
ASSERT_OK(Put(Key(i), v));
}
ASSERT_OK(Flush());
for (int i = 0; i < maxKey; i++) {
ASSERT_EQ(Get(Key(i)), v);
}
uint64_t filter_bytes =
stats.getAndResetTickerCount(BLOCK_CACHE_FILTER_BYTES_INSERT);
EXPECT_NEAR(filter_bytes * 8.0 / maxKey, expected_bpk, 0.3);
if (configs.empty()) {
break;
}
ASSERT_OK(
db_->SetOptions({{"block_based_table_factory",
"{filter_policy=" + configs.back().first + "}"}}));
expected_bpk = configs.back().second;
configs.pop_back();
}
}
class SliceTransformLimitedDomain : public SliceTransform {
const char* Name() const override { return "SliceTransformLimitedDomain"; }

View File

@ -186,14 +186,6 @@ TEST_F(DBOptionsTest, GetLatestDBOptions) {
ASSERT_EQ(new_options, GetMutableDBOptionsMap(dbfull()->GetDBOptions()));
}
// FIXME osolete when table_factory is mutable
static std::unordered_map<std::string, std::string> WithoutTableFactory(
const std::unordered_map<std::string, std::string>& opts) {
auto opts_copy = opts;
opts_copy.erase("table_factory");
return opts_copy;
}
TEST_F(DBOptionsTest, GetLatestCFOptions) {
// GetOptions should be able to get latest option changed by SetOptions.
Options options;
@ -203,16 +195,14 @@ TEST_F(DBOptionsTest, GetLatestCFOptions) {
Reopen(options);
CreateColumnFamilies({"foo"}, options);
ReopenWithColumnFamilies({"default", "foo"}, options);
auto options_default =
WithoutTableFactory(GetRandomizedMutableCFOptionsMap(&rnd));
auto options_foo =
WithoutTableFactory(GetRandomizedMutableCFOptionsMap(&rnd));
auto options_default = GetRandomizedMutableCFOptionsMap(&rnd);
auto options_foo = GetRandomizedMutableCFOptionsMap(&rnd);
ASSERT_OK(dbfull()->SetOptions(handles_[0], options_default));
ASSERT_OK(dbfull()->SetOptions(handles_[1], options_foo));
ASSERT_EQ(options_default, WithoutTableFactory(GetMutableCFOptionsMap(
dbfull()->GetOptions(handles_[0]))));
ASSERT_EQ(options_foo, WithoutTableFactory(GetMutableCFOptionsMap(
dbfull()->GetOptions(handles_[1]))));
ASSERT_EQ(options_default,
GetMutableCFOptionsMap(dbfull()->GetOptions(handles_[0])));
ASSERT_EQ(options_foo,
GetMutableCFOptionsMap(dbfull()->GetOptions(handles_[1])));
}
TEST_F(DBOptionsTest, SetMutableTableOptions) {
@ -241,21 +231,33 @@ TEST_F(DBOptionsTest, SetMutableTableOptions) {
ASSERT_OK(dbfull()->SetOptions(
cfh, {{"table_factory.block_size", "16384"},
{"table_factory.block_restart_interval", "11"}}));
// Old c_bbto
ASSERT_EQ(c_bbto->block_size, 8192);
ASSERT_EQ(c_bbto->block_restart_interval, 7);
// New c_bbto
c_opts = dbfull()->GetOptions(cfh);
c_bbto = c_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_EQ(c_bbto->block_size, 16384);
ASSERT_EQ(c_bbto->block_restart_interval, 11);
// Now set an option that is not mutable - options should not change
ASSERT_NOK(
dbfull()->SetOptions(cfh, {{"table_factory.no_block_cache", "false"}}));
// FIXME: find a way to make this fail again
// ASSERT_NOK(
// dbfull()->SetOptions(cfh, {{"table_factory.no_block_cache", "false"}}));
c_opts = dbfull()->GetOptions(cfh);
ASSERT_EQ(c_bbto, c_opts.table_factory->GetOptions<BlockBasedTableOptions>());
ASSERT_EQ(c_bbto->no_block_cache, true);
ASSERT_EQ(c_bbto->block_size, 16384);
ASSERT_EQ(c_bbto->block_restart_interval, 11);
// Set some that are mutable and some that are not - options should not change
ASSERT_NOK(dbfull()->SetOptions(
cfh, {{"table_factory.no_block_cache", "false"},
{"table_factory.block_size", "8192"},
{"table_factory.block_restart_interval", "7"}}));
// FIXME: find a way to make this fail again
// ASSERT_NOK(dbfull()->SetOptions(
// cfh, {{"table_factory.no_block_cache", "false"},
// {"table_factory.block_size", "8192"},
// {"table_factory.block_restart_interval", "7"}}));
c_opts = dbfull()->GetOptions(cfh);
ASSERT_EQ(c_bbto, c_opts.table_factory->GetOptions<BlockBasedTableOptions>());
ASSERT_EQ(c_bbto->no_block_cache, true);
ASSERT_EQ(c_bbto->block_size, 16384);
ASSERT_EQ(c_bbto->block_restart_interval, 11);
@ -266,6 +268,8 @@ TEST_F(DBOptionsTest, SetMutableTableOptions) {
cfh, {{"table_factory.block_size", "8192"},
{"table_factory.does_not_exist", "true"},
{"table_factory.block_restart_interval", "7"}}));
c_opts = dbfull()->GetOptions(cfh);
ASSERT_EQ(c_bbto, c_opts.table_factory->GetOptions<BlockBasedTableOptions>());
ASSERT_EQ(c_bbto->no_block_cache, true);
ASSERT_EQ(c_bbto->block_size, 16384);
ASSERT_EQ(c_bbto->block_restart_interval, 11);
@ -281,6 +285,7 @@ TEST_F(DBOptionsTest, SetMutableTableOptions) {
{"table_factory.block_restart_interval", "13"}}));
c_opts = dbfull()->GetOptions(cfh);
ASSERT_EQ(c_opts.blob_file_size, 32768);
c_bbto = c_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_EQ(c_bbto->block_size, 16384);
ASSERT_EQ(c_bbto->block_restart_interval, 13);
// Set some on the table and a bad one on the ColumnFamily - options should
@ -289,6 +294,7 @@ TEST_F(DBOptionsTest, SetMutableTableOptions) {
cfh, {{"table_factory.block_size", "1024"},
{"no_such_option", "32768"},
{"table_factory.block_restart_interval", "7"}}));
ASSERT_EQ(c_bbto, c_opts.table_factory->GetOptions<BlockBasedTableOptions>());
ASSERT_EQ(c_bbto->block_size, 16384);
ASSERT_EQ(c_bbto->block_restart_interval, 13);
}

View File

@ -274,6 +274,8 @@ bool StressTest::BuildOptionsTable() {
return true;
}
bool keepRibbonFilterPolicyOnly = FLAGS_bloom_before_level != INT_MAX;
std::unordered_map<std::string, std::vector<std::string>> options_tbl = {
{"write_buffer_size",
{std::to_string(options_.write_buffer_size),
@ -339,16 +341,17 @@ bool StressTest::BuildOptionsTable() {
"2",
}},
{"max_sequential_skip_in_iterations", {"4", "8", "12"}},
// XXX: BlockBasedTableOptions fields are mutable, but there is a
// read-write race condition affecting them with SetOptions.
// See https://github.com/facebook/rocksdb/issues/10079
// {"block_based_table_factory", {"{block_size=2048}",
// "{block_size=4096}"}},
// Also TODO: a way here to modify many different BBTO fields
// {"block_based_table_factory", {"{filter_policy=bloomfilter:2.34",
// "{filter_policy=ribbonfilter:3.45",
// "{filter_policy=ribbonfilter:4.56:-1",
// "{filter_policy=ribbonfilter:6.67:3"}},
{"block_based_table_factory",
{
keepRibbonFilterPolicyOnly ? "{filter_policy=ribbonfilter:2.35}"
: "{filter_policy=bloomfilter:2.34}",
"{filter_policy=ribbonfilter:5.67:-1}",
keepRibbonFilterPolicyOnly ? "{filter_policy=ribbonfilter:8.9:3}"
: "{filter_policy=nullptr}",
"{block_size=" + std::to_string(FLAGS_block_size) + "}",
"{block_size=" +
std::to_string(FLAGS_block_size + (FLAGS_seed & 0xFFFU)) + "}",
}},
};
if (FLAGS_compaction_style == kCompactionStyleUniversal &&
FLAGS_universal_max_read_amp > 0) {
@ -403,7 +406,7 @@ bool StressTest::BuildOptionsTable() {
std::vector<std::string>{"kDisable", "kFlushOnly"});
}
if (FLAGS_bloom_before_level != INT_MAX) {
if (keepRibbonFilterPolicyOnly) {
// Can modify RibbonFilterPolicy field
options_tbl.emplace("table_factory.filter_policy.bloom_before_level",
std::vector<std::string>{"-1", "0", "1", "2",

View File

@ -675,6 +675,8 @@ TEST_P(PrefetchTest, ConfigureAutoMaxReadaheadSize) {
default:
assert(false);
}
ASSERT_OK(iter->status());
ASSERT_OK(iter->Refresh()); // Update to latest mutable options
for (int i = 0; i < num_keys_per_level; ++i) {
iter->Seek(Key(key_count++));
@ -802,6 +804,8 @@ TEST_P(PrefetchTest, ConfigureInternalAutoReadaheadSize) {
default:
assert(false);
}
ASSERT_OK(iter->status());
ASSERT_OK(iter->Refresh()); // Update to latest mutable options
for (int i = 0; i < num_keys_per_level; ++i) {
iter->Seek(Key(key_count++));

View File

@ -47,8 +47,10 @@ class Configurable {
struct RegisteredOptions {
// The name of the options being registered
std::string name;
// Pointer to the object being registered
void* opt_ptr;
// Pointer to the object being registered, relative to `this` so that
// RegisteredOptions are copyable from one Configurable to another of the
// same type, assuming the option is a member of `this`.
intptr_t opt_offset;
// The map of options being registered
const std::unordered_map<std::string, OptionTypeInfo>* type_map;
};
@ -384,9 +386,9 @@ class Configurable {
inline bool HasRegisteredOptions() const { return !options_.empty(); }
private:
// Contains the collection of options (name, opt_ptr, opt_map) associated with
// this object. This collection is typically set in the constructor of the
// Configurable option via
// Contains the collection of options (name, opt_offset, opt_map) associated
// with this object. This collection is typically set in the constructor of
// the specific Configurable via RegisterOptions().
std::vector<RegisteredOptions> options_;
};
} // namespace ROCKSDB_NAMESPACE

View File

@ -128,7 +128,7 @@ struct CacheUsageOptions {
// Configures how SST files using the block-based table format (standard)
// are written and read.
//
// Except as specifically noted, all "simple" options here are "mutable" using
// Except as specifically noted, all options here are "mutable" using
// SetOptions(), with the caveat that only new table builders and new table
// readers will pick up new options. This is nearly immediate effect for
// SST building, but in the worst case, options affecting reads only take
@ -142,9 +142,8 @@ struct CacheUsageOptions {
// "{max_auto_readahead_size=0;block_size=8192;}"}}));
// db->SetOptions({{"block_based_table_factory",
// "{prepopulate_block_cache=kFlushOnly;}"}}));
//
// For now, "simple" options are only non-pointer options that are 64 bits or
// less.
// db->SetOptions({{"block_based_table_factory",
// "{filter_policy=ribbonfilter:10;}"}});
struct BlockBasedTableOptions {
static const char* kName() { return "BlockTableOptions"; }
// @flush_block_policy_factory creates the instances of flush block policy.
@ -278,13 +277,17 @@ struct BlockBasedTableOptions {
// Disable block cache. If this is set to true, then no block cache
// will be configured (block_cache reset to nullptr).
//
// This option cannot be used with SetOptions because it only affects
// the value of `block_cache` during initialization.
// This option should not be used with SetOptions.
bool no_block_cache = false;
// If non-nullptr and no_block_cache == false, use the specified cache for
// blocks. If nullptr and no_block_cache == false, a 32MB internal cache
// will be created and used.
//
// This option should not be used with SetOptions, because (a) the code
// to make it safe is incomplete, and (b) it is not clear when/if the
// old block cache would go away. For now, dynamic changes to block cache
// should be through the Cache object, e.g. Cache::SetCapacity().
std::shared_ptr<Cache> block_cache = nullptr;
// If non-NULL use the specified cache for pages read from device
@ -934,6 +937,11 @@ class TableFactory : public Customizable {
const TableBuilderOptions& table_builder_options,
WritableFileWriter* file) const = 0;
// Clone this TableFactory with the same options, ideally a "shallow" clone
// in which shared_ptr members and hidden state are (safely) shared between
// this original and the returned clone.
virtual std::unique_ptr<TableFactory> Clone() const = 0;
// Return is delete range supported
virtual bool IsDeleteRangeSupported() const { return false; }
};

View File

@ -132,6 +132,92 @@ static Status ParseCompressionOptions(const std::string& value,
return Status::OK();
}
static Status TableFactoryParseFn(const ConfigOptions& opts,
const std::string& name,
const std::string& value, void* addr) {
assert(addr);
auto table_factory = static_cast<std::shared_ptr<TableFactory>*>(addr);
// The general approach to mutating a table factory is to clone it, then
// mutate and save the clone. This avoids race conditions between SetOptions
// and consumers of table_factory/table options by leveraging
// MutableCFOptions infrastructure to track the table_factory pointer.
// However, in the atypical case of setting an option that is safely mutable
// under something pointed to by the table factory, we should avoid cloning.
// The simple way to detect that case is to try with "mutable_options_only"
// and see if it works. If it does, we are finished. If not, we proceed to
// cloning etc.
//
// The canonical example of what is handled here is
// table_factory.filter_policy.bloom_before_level for RibbonFilterPolicy.
if (table_factory->get() != nullptr && !EndsWith(name, "table_factory")) {
ConfigOptions opts_mutable_only{opts};
opts_mutable_only.mutable_options_only = true;
Status s =
table_factory->get()->ConfigureOption(opts_mutable_only, name, value);
if (s.ok()) {
return s;
}
s.PermitUncheckedError();
}
std::shared_ptr<TableFactory> new_factory;
Status s;
if (name == "block_based_table_factory") {
if (table_factory->get() != nullptr) {
std::string factory_name = table_factory->get()->Name();
if (factory_name == TableFactory::kBlockBasedTableName()) {
new_factory = table_factory->get()->Clone();
} else {
s = Status::InvalidArgument("Cannot modify " + factory_name + " as " +
name);
return s;
}
} else {
new_factory.reset(NewBlockBasedTableFactory());
}
// Passing an object string to configure/instantiate a table factory
s = new_factory->ConfigureFromString(opts, value);
} else if (name == "plain_table_factory") {
if (table_factory->get() != nullptr) {
std::string factory_name = table_factory->get()->Name();
if (factory_name == TableFactory::kPlainTableName()) {
new_factory = table_factory->get()->Clone();
} else {
s = Status::InvalidArgument("Cannot modify " + factory_name + " as " +
name);
return s;
}
} else {
new_factory.reset(NewPlainTableFactory());
}
// Passing an object string to configure/instantiate a table factory
s = new_factory->ConfigureFromString(opts, value);
} else if (name == "table_factory" || name == OptionTypeInfo::kIdPropName()) {
// Related to OptionTypeInfo::AsCustomSharedPtr
if (value.empty()) {
new_factory = nullptr;
} else {
s = TableFactory::CreateFromString(opts, value, &new_factory);
}
} else if (table_factory->get() != nullptr) {
new_factory = table_factory->get()->Clone();
// Presumably passing a value for a specific field of the table factory
s = new_factory->ConfigureOption(opts, name, value);
} else {
s = Status::NotFound("Unable to instantiate a table factory from option: ",
name);
return s;
}
// Only keep the modified clone if everything went OK
if (s.ok()) {
*table_factory = std::move(new_factory);
}
return s;
}
const std::string kOptNameBMCompOpts = "bottommost_compression_opts";
const std::string kOptNameCompOpts = "compression_opts";
@ -266,75 +352,25 @@ static std::unordered_map<std::string, OptionTypeInfo>
{offsetof(struct MutableCFOptions, disable_auto_compactions),
OptionType::kBoolean, OptionVerificationType::kNormal,
OptionTypeFlags::kMutable}},
{"table_factory", OptionTypeInfo::AsCustomSharedPtr<TableFactory>(
offsetof(struct MutableCFOptions, table_factory),
OptionVerificationType::kByName,
(OptionTypeFlags::kCompareLoose |
OptionTypeFlags::kStringNameOnly |
OptionTypeFlags::kDontPrepare))},
{"table_factory",
{offsetof(struct MutableCFOptions, table_factory),
OptionType::kCustomizable, OptionVerificationType::kByName,
OptionTypeFlags::kShared | OptionTypeFlags::kCompareLoose |
OptionTypeFlags::kStringNameOnly | OptionTypeFlags::kDontPrepare |
OptionTypeFlags::kMutable,
TableFactoryParseFn}},
{"block_based_table_factory",
{offsetof(struct MutableCFOptions, table_factory),
OptionType::kCustomizable, OptionVerificationType::kAlias,
OptionTypeFlags::kShared | OptionTypeFlags::kCompareLoose,
// Parses the input value and creates a BlockBasedTableFactory
[](const ConfigOptions& opts, const std::string& name,
const std::string& value, void* addr) {
BlockBasedTableOptions* old_opts = nullptr;
auto table_factory =
static_cast<std::shared_ptr<TableFactory>*>(addr);
if (table_factory->get() != nullptr) {
old_opts =
table_factory->get()->GetOptions<BlockBasedTableOptions>();
}
if (name == "block_based_table_factory") {
std::unique_ptr<TableFactory> new_factory;
if (old_opts != nullptr) {
new_factory.reset(NewBlockBasedTableFactory(*old_opts));
} else {
new_factory.reset(NewBlockBasedTableFactory());
}
Status s = new_factory->ConfigureFromString(opts, value);
if (s.ok()) {
table_factory->reset(new_factory.release());
}
return s;
} else if (old_opts != nullptr) {
return table_factory->get()->ConfigureOption(opts, name, value);
} else {
return Status::NotFound("Mismatched table option: ", name);
}
}}},
OptionTypeFlags::kShared | OptionTypeFlags::kCompareLoose |
OptionTypeFlags::kMutable,
TableFactoryParseFn}},
{"plain_table_factory",
{offsetof(struct MutableCFOptions, table_factory),
OptionType::kCustomizable, OptionVerificationType::kAlias,
OptionTypeFlags::kShared | OptionTypeFlags::kCompareLoose,
// Parses the input value and creates a PlainTableFactory
[](const ConfigOptions& opts, const std::string& name,
const std::string& value, void* addr) {
PlainTableOptions* old_opts = nullptr;
auto table_factory =
static_cast<std::shared_ptr<TableFactory>*>(addr);
if (table_factory->get() != nullptr) {
old_opts = table_factory->get()->GetOptions<PlainTableOptions>();
}
if (name == "plain_table_factory") {
std::unique_ptr<TableFactory> new_factory;
if (old_opts != nullptr) {
new_factory.reset(NewPlainTableFactory(*old_opts));
} else {
new_factory.reset(NewPlainTableFactory());
}
Status s = new_factory->ConfigureFromString(opts, value);
if (s.ok()) {
table_factory->reset(new_factory.release());
}
return s;
} else if (old_opts != nullptr) {
return table_factory->get()->ConfigureOption(opts, name, value);
} else {
return Status::NotFound("Mismatched table option: ", name);
}
}}},
OptionTypeFlags::kShared | OptionTypeFlags::kCompareLoose |
OptionTypeFlags::kMutable,
TableFactoryParseFn}},
{"filter_deletes",
{0, OptionType::kBoolean, OptionVerificationType::kDeprecated,
OptionTypeFlags::kMutable}},

View File

@ -17,13 +17,25 @@
namespace ROCKSDB_NAMESPACE {
namespace {
intptr_t GetOffset(const Configurable* holder, void* field) {
return reinterpret_cast<intptr_t>(field) -
reinterpret_cast<intptr_t>(static_cast<const void*>(holder));
}
void* ApplyOffset(const Configurable* holder, intptr_t offset) {
return reinterpret_cast<void*>(
reinterpret_cast<intptr_t>(static_cast<const void*>(holder)) + offset);
}
} // namespace
void Configurable::RegisterOptions(
const std::string& name, void* opt_ptr,
const std::unordered_map<std::string, OptionTypeInfo>* type_map) {
RegisteredOptions opts;
opts.name = name;
opts.type_map = type_map;
opts.opt_ptr = opt_ptr;
opts.opt_offset = GetOffset(this, opt_ptr);
options_.emplace_back(opts);
}
@ -42,7 +54,8 @@ Status Configurable::PrepareOptions(const ConfigOptions& opts) {
for (const auto& map_iter : *(opt_iter.type_map)) {
auto& opt_info = map_iter.second;
if (opt_info.ShouldPrepare()) {
status = opt_info.Prepare(opts, map_iter.first, opt_iter.opt_ptr);
status = opt_info.Prepare(opts, map_iter.first,
ApplyOffset(this, opt_iter.opt_offset));
if (!status.ok()) {
return status;
}
@ -62,7 +75,7 @@ Status Configurable::ValidateOptions(const DBOptions& db_opts,
auto& opt_info = map_iter.second;
if (opt_info.ShouldValidate()) {
status = opt_info.Validate(db_opts, cf_opts, map_iter.first,
opt_iter.opt_ptr);
ApplyOffset(this, opt_iter.opt_offset));
if (!status.ok()) {
return status;
}
@ -82,7 +95,7 @@ Status Configurable::ValidateOptions(const DBOptions& db_opts,
const void* Configurable::GetOptionsPtr(const std::string& name) const {
for (const auto& o : options_) {
if (o.name == name) {
return o.opt_ptr;
return ApplyOffset(this, o.opt_offset);
}
}
return nullptr;
@ -93,14 +106,14 @@ std::string Configurable::GetOptionName(const std::string& opt_name) const {
}
const OptionTypeInfo* ConfigurableHelper::FindOption(
const std::vector<Configurable::RegisteredOptions>& options,
const std::string& short_name, std::string* opt_name, void** opt_ptr) {
for (const auto& iter : options) {
const Configurable& configurable, const std::string& short_name,
std::string* opt_name, void** opt_ptr) {
for (const auto& iter : configurable.options_) {
if (iter.type_map != nullptr) {
const auto opt_info =
OptionTypeInfo::Find(short_name, *(iter.type_map), opt_name);
if (opt_info != nullptr) {
*opt_ptr = iter.opt_ptr;
*opt_ptr = ApplyOffset(&configurable, iter.opt_offset);
return opt_info;
}
}
@ -244,7 +257,8 @@ Status ConfigurableHelper::ConfigureOptions(
for (const auto& iter : configurable.options_) {
if (iter.type_map != nullptr) {
s = ConfigureSomeOptions(config_options, configurable, *(iter.type_map),
&remaining, iter.opt_ptr);
&remaining,
ApplyOffset(&configurable, iter.opt_offset));
if (remaining.empty()) { // Are there more options left?
break;
} else if (!s.ok()) {
@ -354,7 +368,7 @@ Status ConfigurableHelper::ConfigureSingleOption(
std::string elem_name;
void* opt_ptr = nullptr;
const auto opt_info =
FindOption(configurable.options_, opt_name, &elem_name, &opt_ptr);
FindOption(configurable, opt_name, &elem_name, &opt_ptr);
if (opt_info == nullptr) {
return Status::NotFound("Could not find option: ", name);
} else {
@ -507,7 +521,7 @@ Status ConfigurableHelper::GetOption(const ConfigOptions& config_options,
std::string opt_name;
void* opt_ptr = nullptr;
const auto opt_info =
FindOption(configurable.options_, short_name, &opt_name, &opt_ptr);
FindOption(configurable, short_name, &opt_name, &opt_ptr);
if (opt_info != nullptr) {
ConfigOptions embedded = config_options;
embedded.delimiter = ";";
@ -538,22 +552,22 @@ Status ConfigurableHelper::SerializeOptions(const ConfigOptions& config_options,
if (opt_info.ShouldSerialize()) {
std::string value;
Status s;
void* opt_ptr = ApplyOffset(&configurable, opt_iter.opt_offset);
if (!config_options.mutable_options_only) {
s = opt_info.Serialize(config_options, prefix + opt_name,
opt_iter.opt_ptr, &value);
s = opt_info.Serialize(config_options, prefix + opt_name, opt_ptr,
&value);
} else if (opt_info.IsMutable()) {
ConfigOptions copy = config_options;
copy.mutable_options_only = false;
s = opt_info.Serialize(copy, prefix + opt_name, opt_iter.opt_ptr,
&value);
s = opt_info.Serialize(copy, prefix + opt_name, opt_ptr, &value);
} else if (opt_info.IsConfigurable()) {
// If it is a Configurable and we are either printing all of the
// details or not printing only the name, this option should be
// included in the list
if (config_options.IsDetailed() ||
!opt_info.IsEnabled(OptionTypeFlags::kStringNameOnly)) {
s = opt_info.Serialize(config_options, prefix + opt_name,
opt_iter.opt_ptr, &value);
s = opt_info.Serialize(config_options, prefix + opt_name, opt_ptr,
&value);
}
}
if (!s.ok()) {

View File

@ -160,9 +160,9 @@ class ConfigurableHelper {
std::string* mismatch);
private:
// Looks for the option specified by name in the RegisteredOptions.
// This method traverses the types in the input options vector. If an entry
// matching name is found, that entry, opt_name, and pointer are returned.
// Looks for the option specified by name in the RegisteredOptions of a
// configurable. If an entry matching name is found, that entry, opt_name,
// and pointer are returned.
// @param options The vector of options to search through
// @param name The name of the option to search for in the OptionType map
// @param opt_name If the name was found, this value is set to the option name
@ -172,9 +172,10 @@ class ConfigurableHelper {
// in the RegisteredOptions vector associated with this entry
// @return A pointer to the OptionTypeInfo from the options if found,
// nullptr if the name was not found in the input options
static const OptionTypeInfo* FindOption(
const std::vector<Configurable::RegisteredOptions>& options,
const std::string& name, std::string* opt_name, void** opt_ptr);
static const OptionTypeInfo* FindOption(const Configurable& configurable,
const std::string& name,
std::string* opt_name,
void** opt_ptr);
static Status ConfigureCustomizableOption(
const ConfigOptions& config_options, Configurable& configurable,

View File

@ -61,6 +61,9 @@ class UnregisteredTableFactory : public TableFactory {
WritableFileWriter*) const override {
return nullptr;
}
std::unique_ptr<TableFactory> Clone() const override {
return std::make_unique<UnregisteredTableFactory>();
}
};
TEST_F(OptionsTest, GetOptionsFromMapTest) {
@ -1668,23 +1671,32 @@ TEST_F(OptionsTest, MutableTableOptions) {
ASSERT_EQ(bbto->block_size, 1024);
ASSERT_OK(bbtf->PrepareOptions(config_options));
config_options.mutable_options_only = true;
ASSERT_OK(bbtf->ConfigureOption(config_options, "block_size", "1024"));
ASSERT_EQ(bbto->no_block_cache, true);
// Options on BlockBasedTableOptions/Factory are no longer directly mutable
// but have to be mutated on a live DB with SetOptions replacing the
// table_factory with a copy using the new options.
ASSERT_NOK(bbtf->ConfigureOption(config_options, "no_block_cache", "false"));
ASSERT_OK(bbtf->ConfigureOption(config_options, "block_size", "2048"));
ASSERT_NOK(bbtf->ConfigureOption(config_options, "block_size", "2048"));
ASSERT_EQ(bbto->no_block_cache, true);
ASSERT_EQ(bbto->block_size, 2048);
ASSERT_EQ(bbto->block_size, 1024);
ColumnFamilyOptions cf_opts;
cf_opts.table_factory = bbtf;
// FIXME: find a way to make this fail again
/*
ASSERT_NOK(GetColumnFamilyOptionsFromString(
config_options, cf_opts, "block_based_table_factory.no_block_cache=false",
&cf_opts));
*/
ASSERT_OK(GetColumnFamilyOptionsFromString(
config_options, cf_opts, "block_based_table_factory.block_size=8192",
&cf_opts));
ASSERT_EQ(bbto->no_block_cache, true);
ASSERT_EQ(bbto->block_size, 8192);
const auto new_bbto =
cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_NE(new_bbto, nullptr);
ASSERT_NE(new_bbto, bbto);
ASSERT_EQ(new_bbto->no_block_cache, true);
ASSERT_EQ(new_bbto->block_size, 8192);
ASSERT_EQ(bbto->block_size, 1024);
}
TEST_F(OptionsTest, MutableCFOptions) {
@ -1698,7 +1710,7 @@ TEST_F(OptionsTest, MutableCFOptions) {
&cf_opts));
ASSERT_TRUE(cf_opts.paranoid_file_checks);
ASSERT_NE(cf_opts.table_factory.get(), nullptr);
const auto bbto = cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
auto* bbto = cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_NE(bbto, nullptr);
ASSERT_EQ(bbto->block_size, 8192);
ASSERT_EQ(bbto->block_align, false);
@ -1707,10 +1719,11 @@ TEST_F(OptionsTest, MutableCFOptions) {
config_options, cf_opts, {{"paranoid_file_checks", "false"}}, &cf_opts));
ASSERT_EQ(cf_opts.paranoid_file_checks, false);
// Should replace the factory with the new setting
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory.block_size", "16384"}}, &cf_opts));
ASSERT_EQ(bbto, cf_opts.table_factory->GetOptions<BlockBasedTableOptions>());
bbto = cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_EQ(bbto->block_size, 16384);
config_options.mutable_options_only = true;
@ -1719,45 +1732,103 @@ TEST_F(OptionsTest, MutableCFOptions) {
config_options, cf_opts, {{"force_consistency_checks", "true"}},
&cf_opts));
// Attempt to change the table. It is not mutable, so this should fail and
// leave the original intact
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
// Attempt to change the table factory kind. This was previously disallowed
// and is a dubious operation but is tricky to disallow without breaking
// other things (FIXME?)
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts, {{"table_factory", "PlainTable"}}, &cf_opts));
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
ASSERT_STREQ(cf_opts.table_factory->Name(), TableFactory::kPlainTableName());
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts, {{"table_factory", "BlockBasedTable"}},
&cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(),
TableFactory::kBlockBasedTableName());
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts, {{"table_factory.id", "PlainTable"}}, &cf_opts));
ASSERT_NE(cf_opts.table_factory.get(), nullptr);
ASSERT_EQ(bbto, cf_opts.table_factory->GetOptions<BlockBasedTableOptions>());
ASSERT_STREQ(cf_opts.table_factory->Name(), TableFactory::kPlainTableName());
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts, {{"table_factory.id", "BlockBasedTable"}},
&cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(),
TableFactory::kBlockBasedTableName());
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"table_factory", "{id=PlainTable;bloom_bits_per_key=42}"}}, &cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(), TableFactory::kPlainTableName());
// Change the block size. Should update the value in the current table
// Should at least be allowed to instantiate in place of nullptr, for
// initialization purposes.
cf_opts.table_factory = nullptr;
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"table_factory", "{id=BlockBasedTable;block_size=12345}"}}, &cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(),
TableFactory::kBlockBasedTableName());
bbto = cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_EQ(bbto->block_size, 12345);
// Accessing through the wrong factory alias fails gracefully
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"plain_table_factory", "{bloom_bits_per_key=42}"}}, &cf_opts));
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"plain_table_factory.bloom_bits_per_key", "42"}}, &cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(),
TableFactory::kBlockBasedTableName());
// Change the block size.
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory.block_size", "8192"}}, &cf_opts));
ASSERT_EQ(bbto, cf_opts.table_factory->GetOptions<BlockBasedTableOptions>());
bbto = cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_EQ(bbto->block_size, 8192);
// Attempt to turn off block cache fails, as this option is not mutable
// FIXME: find a way to make this fail again
/*
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory.no_block_cache", "true"}}, &cf_opts));
ASSERT_EQ(bbto, cf_opts.table_factory->GetOptions<BlockBasedTableOptions>());
*/
// Attempt to change the block size via a config string/map. Should update
// the current value
// Attempt to change the block size via a config string/map.
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory", "{block_size=32768}"}}, &cf_opts));
ASSERT_EQ(bbto, cf_opts.table_factory->GetOptions<BlockBasedTableOptions>());
bbto = cf_opts.table_factory->GetOptions<BlockBasedTableOptions>();
ASSERT_EQ(bbto->block_size, 32768);
// Attempt to change the block size and no cache through the map. Should
// fail, leaving the old values intact
// FIXME: find a way to make this fail again
/*
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory",
"{block_size=16384; no_block_cache=true}"}},
&cf_opts));
ASSERT_EQ(bbto, cf_opts.table_factory->GetOptions<BlockBasedTableOptions>());
*/
ASSERT_EQ(bbto->block_size, 32768);
// Switch to plain table for some tests
cf_opts.table_factory = nullptr;
ASSERT_OK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"table_factory", "{id=PlainTable;bloom_bits_per_key=42}"}}, &cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(), TableFactory::kPlainTableName());
auto* pto = cf_opts.table_factory->GetOptions<PlainTableOptions>();
ASSERT_EQ(pto->bloom_bits_per_key, 42);
// Accessing through the wrong factory alias fails gracefully
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory.block_size", "8192"}}, &cf_opts));
ASSERT_NOK(GetColumnFamilyOptionsFromMap(
config_options, cf_opts,
{{"block_based_table_factory", "{block_size=32768}"}}, &cf_opts));
ASSERT_STREQ(cf_opts.table_factory->Name(), TableFactory::kPlainTableName());
ASSERT_EQ(pto, cf_opts.table_factory->GetOptions<PlainTableOptions>());
}

View File

@ -46,6 +46,10 @@ class AdaptiveTableFactory : public TableFactory {
std::string GetPrintableOptions() const override;
std::unique_ptr<TableFactory> Clone() const override {
return std::make_unique<AdaptiveTableFactory>(*this);
}
private:
std::shared_ptr<TableFactory> table_factory_to_write_;
std::shared_ptr<TableFactory> block_based_table_factory_;

View File

@ -394,34 +394,6 @@ static struct BlockBasedTableTypeInfo {
num_file_reads_for_auto_readahead),
OptionType::kUInt64T, OptionVerificationType::kNormal}},
};
for (auto& i : info) {
switch (i.second.GetType()) {
case OptionType::kString:
case OptionType::kEnv:
case OptionType::kStruct:
case OptionType::kVector:
case OptionType::kConfigurable:
case OptionType::kCustomizable:
case OptionType::kEncodedString:
case OptionType::kArray:
case OptionType::kUnknown:
// Not mutable, at least until race condition is resolved
break;
default:
if (i.first == "no_block_cache") {
// Special case of not being mutable; only makes sense at
// initialization time, and for non-expert users
assert((i.second.GetFlags() & OptionTypeFlags::kMutable) ==
OptionTypeFlags::kNone);
} else {
// Values up to 64 bits should be generally safe to mutate despite
// the read-write race.
i.second.SetFlags(i.second.GetFlags() | OptionTypeFlags::kMutable);
}
break;
}
}
}
} block_based_table_type_info;
@ -429,7 +401,8 @@ static struct BlockBasedTableTypeInfo {
// options
BlockBasedTableFactory::BlockBasedTableFactory(
const BlockBasedTableOptions& _table_options)
: table_options_(_table_options) {
: table_options_(_table_options),
shared_state_(std::make_shared<SharedState>()) {
InitializeOptions();
RegisterOptions(&table_options_, &block_based_table_type_info.info);
@ -439,10 +412,11 @@ BlockBasedTableFactory::BlockBasedTableFactory(
.charged;
if (table_options_.block_cache &&
table_reader_charged == CacheEntryRoleOptions::Decision::kEnabled) {
table_reader_cache_res_mgr_.reset(new ConcurrentCacheReservationManager(
std::make_shared<CacheReservationManagerImpl<
CacheEntryRole::kBlockBasedTableReader>>(
table_options_.block_cache)));
shared_state_->table_reader_cache_res_mgr =
std::make_shared<ConcurrentCacheReservationManager>(
std::make_shared<CacheReservationManagerImpl<
CacheEntryRole::kBlockBasedTableReader>>(
table_options_.block_cache));
}
}
@ -580,11 +554,13 @@ Status BlockBasedTableFactory::NewTableReader(
ro, table_reader_options.ioptions, table_reader_options.env_options,
table_options_, table_reader_options.internal_comparator, std::move(file),
file_size, table_reader_options.block_protection_bytes_per_key,
table_reader, table_reader_options.tail_size, table_reader_cache_res_mgr_,
table_reader, table_reader_options.tail_size,
shared_state_->table_reader_cache_res_mgr,
table_reader_options.prefix_extractor, prefetch_index_and_filter_in_cache,
table_reader_options.skip_filters, table_reader_options.level,
table_reader_options.immortal, table_reader_options.largest_seqno,
table_reader_options.force_direct_prefetch, &tail_prefetch_stats_,
table_reader_options.force_direct_prefetch,
&shared_state_->tail_prefetch_stats,
table_reader_options.block_cache_tracer,
table_reader_options.max_file_size_for_l0_meta_pin,
table_reader_options.cur_db_session_id, table_reader_options.cur_file_num,

View File

@ -79,7 +79,13 @@ class BlockBasedTableFactory : public TableFactory {
bool IsDeleteRangeSupported() const override { return true; }
TailPrefetchStats* tail_prefetch_stats() { return &tail_prefetch_stats_; }
std::unique_ptr<TableFactory> Clone() const override {
return std::make_unique<BlockBasedTableFactory>(*this);
}
TailPrefetchStats* tail_prefetch_stats() {
return &shared_state_->tail_prefetch_stats;
}
protected:
const void* GetOptionsPtr(const std::string& name) const override;
@ -91,8 +97,12 @@ class BlockBasedTableFactory : public TableFactory {
private:
BlockBasedTableOptions table_options_;
std::shared_ptr<CacheReservationManager> table_reader_cache_res_mgr_;
mutable TailPrefetchStats tail_prefetch_stats_;
// Share some state among cloned instances
struct SharedState {
std::shared_ptr<CacheReservationManager> table_reader_cache_res_mgr;
TailPrefetchStats tail_prefetch_stats;
};
std::shared_ptr<SharedState> shared_state_;
};
extern const std::string kHashIndexPrefixesBlock;

View File

@ -73,6 +73,10 @@ class CuckooTableFactory : public TableFactory {
std::string GetPrintableOptions() const override;
std::unique_ptr<TableFactory> Clone() const override {
return std::make_unique<CuckooTableFactory>(*this);
}
private:
CuckooTableOptions table_options_;
};

View File

@ -76,6 +76,9 @@ class MockTableFactory : public TableFactory {
// contents are equal to file_contents
void AssertSingleFile(const KVVector& file_contents);
void AssertLatestFiles(const std::vector<KVVector>& files_contents);
std::unique_ptr<TableFactory> Clone() const override {
return nullptr; // Not implemented
}
private:
Status GetAndWriteNextID(WritableFileWriter* file, uint32_t* id) const;

View File

@ -173,6 +173,10 @@ class PlainTableFactory : public TableFactory {
std::string GetPrintableOptions() const override;
static const char kValueTypeSeqId0 = char(~0);
std::unique_ptr<TableFactory> Clone() const override {
return std::make_unique<PlainTableFactory>(*this);
}
private:
PlainTableOptions table_options_;
};

View File

@ -448,7 +448,7 @@ blackbox_default_params = {
# since we will be killing anyway, use large value for ops_per_thread
"ops_per_thread": 100000000,
"reopen": 0,
"set_options_one_in": 10000,
"set_options_one_in": 2000,
}
whitebox_default_params = {

View File

@ -0,0 +1 @@
Fix a longstanding race condition in SetOptions for `block_based_table_factory` options. The fix has some subtle behavior changes because of copying and replacing the TableFactory on a change with SetOptions, including requiring an Iterator::Refresh() for an existing Iterator to use the latest options.

View File

@ -179,6 +179,8 @@ class DummyTableFactory : public TableFactory {
}
std::string GetPrintableOptions() const override { return ""; }
std::unique_ptr<TableFactory> Clone() const override { return nullptr; }
};
class DummyMergeOperator : public MergeOperator {