|
|
|
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
|
|
|
// This source code is licensed under both the GPLv2 (found in the
|
|
|
|
// COPYING file in the root directory) and Apache 2.0 License
|
|
|
|
// (found in the LICENSE.Apache file in the root directory).
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#ifndef ROCKSDB_LITE
|
|
|
|
|
|
|
|
#include <memory>
|
|
|
|
#include <string>
|
|
|
|
|
|
|
|
#include "rocksdb/env.h"
|
|
|
|
#include "rocksdb/options.h"
|
|
|
|
#include "rocksdb/table_properties.h"
|
|
|
|
#include "rocksdb/types.h"
|
|
|
|
|
|
|
|
#if defined(__GNUC__) || defined(__clang__)
|
|
|
|
#define ROCKSDB_DEPRECATED_FUNC __attribute__((__deprecated__))
|
|
|
|
#elif _WIN32
|
|
|
|
#define ROCKSDB_DEPRECATED_FUNC __declspec(deprecated)
|
|
|
|
#endif
|
|
|
|
|
|
|
|
namespace ROCKSDB_NAMESPACE {
|
|
|
|
|
|
|
|
class Comparator;
|
|
|
|
|
|
|
|
// ExternalSstFileInfo include information about sst files created
|
|
|
|
// using SstFileWriter.
|
|
|
|
struct ExternalSstFileInfo {
|
|
|
|
ExternalSstFileInfo()
|
|
|
|
: file_path(""),
|
|
|
|
smallest_key(""),
|
|
|
|
largest_key(""),
|
|
|
|
smallest_range_del_key(""),
|
|
|
|
largest_range_del_key(""),
|
|
|
|
file_checksum(""),
|
|
|
|
file_checksum_func_name(""),
|
|
|
|
sequence_number(0),
|
|
|
|
file_size(0),
|
|
|
|
num_entries(0),
|
|
|
|
num_range_del_entries(0),
|
|
|
|
version(0) {}
|
|
|
|
|
|
|
|
ExternalSstFileInfo(const std::string& _file_path,
|
|
|
|
const std::string& _smallest_key,
|
|
|
|
const std::string& _largest_key,
|
|
|
|
SequenceNumber _sequence_number, uint64_t _file_size,
|
|
|
|
int32_t _num_entries, int32_t _version)
|
|
|
|
: file_path(_file_path),
|
|
|
|
smallest_key(_smallest_key),
|
|
|
|
largest_key(_largest_key),
|
|
|
|
smallest_range_del_key(""),
|
|
|
|
largest_range_del_key(""),
|
|
|
|
file_checksum(""),
|
|
|
|
file_checksum_func_name(""),
|
|
|
|
sequence_number(_sequence_number),
|
|
|
|
file_size(_file_size),
|
|
|
|
num_entries(_num_entries),
|
|
|
|
num_range_del_entries(0),
|
|
|
|
version(_version) {}
|
|
|
|
|
|
|
|
std::string file_path; // external sst file path
|
|
|
|
std::string smallest_key; // smallest user key in file
|
|
|
|
std::string largest_key; // largest user key in file
|
|
|
|
std::string
|
|
|
|
smallest_range_del_key; // smallest range deletion user key in file
|
|
|
|
std::string largest_range_del_key; // largest range deletion user key in file
|
|
|
|
std::string file_checksum; // sst file checksum;
|
|
|
|
std::string file_checksum_func_name; // The name of file checksum function
|
|
|
|
SequenceNumber sequence_number; // sequence number of all keys in file
|
|
|
|
uint64_t file_size; // file size in bytes
|
|
|
|
uint64_t num_entries; // number of entries in file
|
|
|
|
uint64_t num_range_del_entries; // number of range deletion entries in file
|
|
|
|
int32_t version; // file version
|
|
|
|
};
|
|
|
|
|
|
|
|
// SstFileWriter is used to create sst files that can be added to database later
|
|
|
|
// All keys in files generated by SstFileWriter will have sequence number = 0.
|
|
|
|
class SstFileWriter {
|
|
|
|
public:
|
|
|
|
// User can pass `column_family` to specify that the generated file will
|
|
|
|
// be ingested into this column_family, note that passing nullptr means that
|
|
|
|
// the column_family is unknown.
|
|
|
|
// If invalidate_page_cache is set to true, SstFileWriter will give the OS a
|
|
|
|
// hint that this file pages is not needed every time we write 1MB to the
|
|
|
|
// file. To use the rate limiter an io_priority smaller than IO_TOTAL can be
|
|
|
|
// passed.
|
Add more LSM info to FilterBuildingContext (#8246)
Summary:
Add `num_levels`, `is_bottommost`, and table file creation
`reason` to `FilterBuildingContext`, in anticipation of more powerful
Bloom-like filter support.
To support this, added `is_bottommost` and `reason` to
`TableBuilderOptions`, which allowed removing `reason` parameter from
`rocksdb::BuildTable`.
I attempted to remove `skip_filters` from `TableBuilderOptions`, because
filter construction decisions should arise from options, not one-off
parameters. I could not completely remove it because the public API for
SstFileWriter takes a `skip_filters` parameter, and translating this
into an option change would mean awkwardly replacing the table_factory
if it is BlockBasedTableFactory with new filter_policy=nullptr option.
I marked this public skip_filters option as deprecated because of this
oddity. (skip_filters on the read side probably makes sense.)
At least `skip_filters` is now largely hidden for users of
`TableBuilderOptions` and is no longer used for implementing the
optimize_filters_for_hits option. Bringing the logic for that option
closer to handling of FilterBuildingContext makes it more obvious that
hese two are using the same notion of "bottommost." (Planned:
configuration options for Bloom-like filters that generalize
`optimize_filters_for_hits`)
Recommended follow-up: Try to get away from "bottommost level" naming of
things, which is inaccurate (see
VersionStorageInfo::RangeMightExistAfterSortedRun), and move to
"bottommost run" or just "bottommost."
Pull Request resolved: https://github.com/facebook/rocksdb/pull/8246
Test Plan:
extended an existing unit test to exercise and check various
filter building contexts. Also, existing tests for
optimize_filters_for_hits validate some of the "bottommost" handling,
which is now closely connected to FilterBuildingContext::is_bottommost
through TableBuilderOptions::is_bottommost
Reviewed By: mrambacher
Differential Revision: D28099346
Pulled By: pdillinger
fbshipit-source-id: 2c1072e29c24d4ac404c761a7b7663292372600a
4 years ago
|
|
|
// The `skip_filters` option is DEPRECATED and could be removed in the
|
|
|
|
// future. Use `BlockBasedTableOptions::filter_policy` to control filter
|
|
|
|
// generation.
|
|
|
|
SstFileWriter(const EnvOptions& env_options, const Options& options,
|
|
|
|
ColumnFamilyHandle* column_family = nullptr,
|
|
|
|
bool invalidate_page_cache = true,
|
|
|
|
Env::IOPriority io_priority = Env::IOPriority::IO_TOTAL,
|
|
|
|
bool skip_filters = false)
|
|
|
|
: SstFileWriter(env_options, options, options.comparator, column_family,
|
|
|
|
invalidate_page_cache, io_priority, skip_filters) {}
|
|
|
|
|
|
|
|
// Deprecated API
|
|
|
|
SstFileWriter(const EnvOptions& env_options, const Options& options,
|
|
|
|
const Comparator* user_comparator,
|
|
|
|
ColumnFamilyHandle* column_family = nullptr,
|
|
|
|
bool invalidate_page_cache = true,
|
|
|
|
Env::IOPriority io_priority = Env::IOPriority::IO_TOTAL,
|
|
|
|
bool skip_filters = false);
|
|
|
|
|
|
|
|
~SstFileWriter();
|
|
|
|
|
|
|
|
// Prepare SstFileWriter to write into file located at "file_path".
|
|
|
|
Status Open(const std::string& file_path);
|
|
|
|
|
|
|
|
// Add a Put key with value to currently opened file (deprecated)
|
|
|
|
// REQUIRES: key is after any previously added key according to comparator.
|
|
|
|
// REQUIRES: comparator is *not* timestamp-aware.
|
|
|
|
ROCKSDB_DEPRECATED_FUNC Status Add(const Slice& user_key, const Slice& value);
|
|
|
|
|
|
|
|
// Add a Put key with value to currently opened file
|
|
|
|
// REQUIRES: key is after any previously added key according to comparator.
|
|
|
|
// REQUIRES: comparator is *not* timestamp-aware.
|
|
|
|
Status Put(const Slice& user_key, const Slice& value);
|
|
|
|
|
|
|
|
// Add a Put (key with timestamp, value) to the currently opened file
|
|
|
|
// REQUIRES: key is after any previously added key according to the
|
|
|
|
// comparator.
|
|
|
|
// REQUIRES: the timestamp's size is equal to what is expected by
|
|
|
|
// the comparator.
|
|
|
|
Status Put(const Slice& user_key, const Slice& timestamp, const Slice& value);
|
|
|
|
|
|
|
|
// Add a Merge key with value to currently opened file
|
|
|
|
// REQUIRES: key is after any previously added key according to comparator.
|
|
|
|
// REQUIRES: comparator is *not* timestamp-aware.
|
|
|
|
Status Merge(const Slice& user_key, const Slice& value);
|
|
|
|
|
|
|
|
// Add a deletion key to currently opened file
|
|
|
|
// REQUIRES: key is after any previously added key according to comparator.
|
|
|
|
// REQUIRES: comparator is *not* timestamp-aware.
|
|
|
|
Status Delete(const Slice& user_key);
|
|
|
|
|
|
|
|
// Add a deletion key with timestamp to the currently opened file
|
|
|
|
// REQUIRES: key is after any previously added key according to the
|
|
|
|
// comparator.
|
|
|
|
// REQUIRES: the timestamp's size is equal to what is expected by
|
|
|
|
// the comparator.
|
|
|
|
Status Delete(const Slice& user_key, const Slice& timestamp);
|
|
|
|
|
|
|
|
// Add a range deletion tombstone to currently opened file
|
|
|
|
// REQUIRES: comparator is *not* timestamp-aware.
|
|
|
|
Status DeleteRange(const Slice& begin_key, const Slice& end_key);
|
|
|
|
|
|
|
|
// Finalize writing to sst file and close file.
|
|
|
|
//
|
|
|
|
// An optional ExternalSstFileInfo pointer can be passed to the function
|
|
|
|
// which will be populated with information about the created sst file.
|
|
|
|
Status Finish(ExternalSstFileInfo* file_info = nullptr);
|
|
|
|
|
|
|
|
// Return the current file size.
|
|
|
|
uint64_t FileSize();
|
|
|
|
|
|
|
|
private:
|
|
|
|
void InvalidatePageCache(bool closing);
|
|
|
|
struct Rep;
|
|
|
|
std::unique_ptr<Rep> rep_;
|
|
|
|
};
|
|
|
|
} // namespace ROCKSDB_NAMESPACE
|
|
|
|
|
|
|
|
#endif // !ROCKSDB_LITE
|