Add DataBlockIndexType option in BlockBasedTableOptions (#4150)

Summary:
Added DataBlockIndexType option in BlockBasedTableOptions.
```
enum DataBlockIndexType : char {
    kDataBlockBinarySearch = 0, // traditional block type
    kDataBlockHashSearch = 1, // additional hash index appended to the end.
};
```
The default type is the traditional binary search option: `kDataBlockBinarySearch`.
Pull Request resolved: https://github.com/facebook/rocksdb/pull/4150

Differential Revision: D8895958

Pulled By: fgwu

fbshipit-source-id: 480adef48104cf11d30db3bad9a73f98b4a80c10
main
Fenggang Wu 7 years ago committed by Facebook Github Bot
parent f5e46354d2
commit a11df583ec
  1. 9
      include/rocksdb/table.h
  2. 2
      options/options.cc
  3. 18
      options/options_helper.cc
  4. 6
      options/options_helper.h
  5. 6
      options/options_parser.cc
  6. 1
      options/options_settable_test.cc
  7. 4
      table/block_based_table_factory.h

@ -100,6 +100,15 @@ struct BlockBasedTableOptions {
IndexType index_type = kBinarySearch; IndexType index_type = kBinarySearch;
// The index type that will be used for the data block.
// Two DataBlockIndexType values are currently supported.
enum DataBlockIndexType : char {
kDataBlockBinarySearch = 0, // traditional block type
kDataBlockHashSearch = 1, // additional hash index appended to the end.
};
// Defaults to kDataBlockBinarySearch, the traditional block type.
DataBlockIndexType data_block_index_type = kDataBlockBinarySearch;
// This option is now deprecated. No matter what value it is set to, // This option is now deprecated. No matter what value it is set to,
// it will behave as if hash_index_allow_collision=true. // it will behave as if hash_index_allow_collision=true.
bool hash_index_allow_collision = true; bool hash_index_allow_collision = true;

@ -479,6 +479,8 @@ ColumnFamilyOptions* ColumnFamilyOptions::OptimizeForPointLookup(
prefix_extractor.reset(NewNoopTransform()); prefix_extractor.reset(NewNoopTransform());
BlockBasedTableOptions block_based_options; BlockBasedTableOptions block_based_options;
block_based_options.index_type = BlockBasedTableOptions::kHashSearch; block_based_options.index_type = BlockBasedTableOptions::kHashSearch;
block_based_options.data_block_index_type =
BlockBasedTableOptions::kDataBlockBinarySearch;
block_based_options.filter_policy.reset(NewBloomFilterPolicy(10)); block_based_options.filter_policy.reset(NewBloomFilterPolicy(10));
block_based_options.block_cache = block_based_options.block_cache =
NewLRUCache(static_cast<size_t>(block_cache_size_mb * 1024 * 1024)); NewLRUCache(static_cast<size_t>(block_cache_size_mb * 1024 * 1024));

@ -494,6 +494,11 @@ bool ParseOptionHelper(char* opt_address, const OptionType& opt_type,
return ParseEnum<BlockBasedTableOptions::IndexType>( return ParseEnum<BlockBasedTableOptions::IndexType>(
block_base_table_index_type_string_map, value, block_base_table_index_type_string_map, value,
reinterpret_cast<BlockBasedTableOptions::IndexType*>(opt_address)); reinterpret_cast<BlockBasedTableOptions::IndexType*>(opt_address));
case OptionType::kBlockBasedTableDataBlockIndexType:
return ParseEnum<BlockBasedTableOptions::DataBlockIndexType>(
block_base_table_data_block_index_type_string_map, value,
reinterpret_cast<BlockBasedTableOptions::DataBlockIndexType*>(
opt_address));
case OptionType::kEncodingType: case OptionType::kEncodingType:
return ParseEnum<EncodingType>( return ParseEnum<EncodingType>(
encoding_type_string_map, value, encoding_type_string_map, value,
@ -673,6 +678,12 @@ bool SerializeSingleOptionHelper(const char* opt_address,
*reinterpret_cast<const BlockBasedTableOptions::IndexType*>( *reinterpret_cast<const BlockBasedTableOptions::IndexType*>(
opt_address), opt_address),
value); value);
case OptionType::kBlockBasedTableDataBlockIndexType:
return SerializeEnum<BlockBasedTableOptions::DataBlockIndexType>(
block_base_table_data_block_index_type_string_map,
*reinterpret_cast<const BlockBasedTableOptions::DataBlockIndexType*>(
opt_address),
value);
case OptionType::kFlushBlockPolicyFactory: { case OptionType::kFlushBlockPolicyFactory: {
const auto* ptr = const auto* ptr =
reinterpret_cast<const std::shared_ptr<FlushBlockPolicyFactory>*>( reinterpret_cast<const std::shared_ptr<FlushBlockPolicyFactory>*>(
@ -1552,6 +1563,13 @@ std::unordered_map<std::string, BlockBasedTableOptions::IndexType>
{"kTwoLevelIndexSearch", {"kTwoLevelIndexSearch",
BlockBasedTableOptions::IndexType::kTwoLevelIndexSearch}}; BlockBasedTableOptions::IndexType::kTwoLevelIndexSearch}};
// Maps the string name of each BlockBasedTableOptions::DataBlockIndexType
// value to its enumerator. This table is handed to ParseEnum and
// SerializeEnum for OptionType::kBlockBasedTableDataBlockIndexType.
std::unordered_map<std::string, BlockBasedTableOptions::DataBlockIndexType>
OptionsHelper::block_base_table_data_block_index_type_string_map = {
{"kDataBlockBinarySearch",
BlockBasedTableOptions::DataBlockIndexType::kDataBlockBinarySearch},
{"kDataBlockHashSearch",
BlockBasedTableOptions::DataBlockIndexType::kDataBlockHashSearch}};
std::unordered_map<std::string, EncodingType> std::unordered_map<std::string, EncodingType>
OptionsHelper::encoding_type_string_map = {{"kPlain", kPlain}, OptionsHelper::encoding_type_string_map = {{"kPlain", kPlain},
{"kPrefix", kPrefix}}; {"kPrefix", kPrefix}};

@ -69,6 +69,7 @@ enum class OptionType {
kMergeOperator, kMergeOperator,
kMemTableRepFactory, kMemTableRepFactory,
kBlockBasedTableIndexType, kBlockBasedTableIndexType,
kBlockBasedTableDataBlockIndexType,
kFilterPolicy, kFilterPolicy,
kFlushBlockPolicyFactory, kFlushBlockPolicyFactory,
kChecksumType, kChecksumType,
@ -163,6 +164,9 @@ struct OptionsHelper {
lru_cache_options_type_info; lru_cache_options_type_info;
static std::unordered_map<std::string, BlockBasedTableOptions::IndexType> static std::unordered_map<std::string, BlockBasedTableOptions::IndexType>
block_base_table_index_type_string_map; block_base_table_index_type_string_map;
static std::unordered_map<std::string,
BlockBasedTableOptions::DataBlockIndexType>
block_base_table_data_block_index_type_string_map;
static std::unordered_map<std::string, EncodingType> encoding_type_string_map; static std::unordered_map<std::string, EncodingType> encoding_type_string_map;
static std::unordered_map<std::string, CompactionStyle> static std::unordered_map<std::string, CompactionStyle>
compaction_style_string_map; compaction_style_string_map;
@ -203,6 +207,8 @@ static auto& compression_type_string_map =
OptionsHelper::compression_type_string_map; OptionsHelper::compression_type_string_map;
static auto& block_base_table_index_type_string_map = static auto& block_base_table_index_type_string_map =
OptionsHelper::block_base_table_index_type_string_map; OptionsHelper::block_base_table_index_type_string_map;
static auto& block_base_table_data_block_index_type_string_map =
OptionsHelper::block_base_table_data_block_index_type_string_map;
static auto& encoding_type_string_map = OptionsHelper::encoding_type_string_map; static auto& encoding_type_string_map = OptionsHelper::encoding_type_string_map;
static auto& compaction_style_string_map = static auto& compaction_style_string_map =
OptionsHelper::compaction_style_string_map; OptionsHelper::compaction_style_string_map;

@ -592,6 +592,12 @@ bool AreEqualOptions(
*reinterpret_cast<const BlockBasedTableOptions::IndexType*>( *reinterpret_cast<const BlockBasedTableOptions::IndexType*>(
offset1) == offset1) ==
*reinterpret_cast<const BlockBasedTableOptions::IndexType*>(offset2)); *reinterpret_cast<const BlockBasedTableOptions::IndexType*>(offset2));
case OptionType::kBlockBasedTableDataBlockIndexType:
return (
*reinterpret_cast<const BlockBasedTableOptions::DataBlockIndexType*>(
offset1) ==
*reinterpret_cast<const BlockBasedTableOptions::DataBlockIndexType*>(
offset2));
case OptionType::kWALRecoveryMode: case OptionType::kWALRecoveryMode:
return (*reinterpret_cast<const WALRecoveryMode*>(offset1) == return (*reinterpret_cast<const WALRecoveryMode*>(offset1) ==
*reinterpret_cast<const WALRecoveryMode*>(offset2)); *reinterpret_cast<const WALRecoveryMode*>(offset2));

@ -142,6 +142,7 @@ TEST_F(OptionsSettableTest, BlockBasedTableOptionsAllFieldsSettable) {
"pin_l0_filter_and_index_blocks_in_cache=1;" "pin_l0_filter_and_index_blocks_in_cache=1;"
"pin_top_level_index_and_filter=1;" "pin_top_level_index_and_filter=1;"
"index_type=kHashSearch;" "index_type=kHashSearch;"
"data_block_index_type=kDataBlockHashSearch;"
"checksum=kxxHash;hash_index_allow_collision=1;no_block_cache=1;" "checksum=kxxHash;hash_index_allow_collision=1;no_block_cache=1;"
"block_cache=1M;block_cache_compressed=1k;block_size=1024;" "block_cache=1M;block_cache_compressed=1k;block_size=1024;"
"block_size_deviation=8;block_restart_interval=4; " "block_size_deviation=8;block_restart_interval=4; "

@ -123,6 +123,10 @@ static std::unordered_map<std::string, OptionTypeInfo>
{"hash_index_allow_collision", {"hash_index_allow_collision",
{offsetof(struct BlockBasedTableOptions, hash_index_allow_collision), {offsetof(struct BlockBasedTableOptions, hash_index_allow_collision),
OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}}, OptionType::kBoolean, OptionVerificationType::kNormal, false, 0}},
{"data_block_index_type",
{offsetof(struct BlockBasedTableOptions, data_block_index_type),
OptionType::kBlockBasedTableDataBlockIndexType,
OptionVerificationType::kNormal, false, 0}},
{"checksum", {"checksum",
{offsetof(struct BlockBasedTableOptions, checksum), {offsetof(struct BlockBasedTableOptions, checksum),
OptionType::kChecksumType, OptionVerificationType::kNormal, false, OptionType::kChecksumType, OptionVerificationType::kNormal, false,

Loading…
Cancel
Save