@ -4,8 +4,10 @@
// (found in the LICENSE.Apache file in the root directory).
// (found in the LICENSE.Apache file in the root directory).
# include <array>
# include <array>
# include <sstream>
# include "db/blob/blob_index.h"
# include "db/blob/blob_index.h"
# include "db/blob/blob_log_format.h"
# include "db/db_test_util.h"
# include "db/db_test_util.h"
# include "port/stack_trace.h"
# include "port/stack_trace.h"
# include "test_util/sync_point.h"
# include "test_util/sync_point.h"
@ -372,103 +374,139 @@ TEST_F(DBBlobBasicTest, Properties) {
Options options = GetDefaultOptions ( ) ;
Options options = GetDefaultOptions ( ) ;
options . enable_blob_files = true ;
options . enable_blob_files = true ;
options . min_blob_size = 0 ;
options . min_blob_size = 0 ;
Reopen ( options ) ;
Reopen ( options ) ;
ASSERT_OK ( Put ( " key1 " , " 0000000000 " ) ) ;
ASSERT_OK ( Put ( " key2 " , " 0000000000 " ) ) ;
constexpr char key1 [ ] = " key1 " ;
constexpr size_t key1_size = sizeof ( key1 ) - 1 ;
constexpr char key2 [ ] = " key2 " ;
constexpr size_t key2_size = sizeof ( key2 ) - 1 ;
constexpr char key3 [ ] = " key3 " ;
constexpr size_t key3_size = sizeof ( key3 ) - 1 ;
constexpr char blob [ ] = " 0000000000 " ;
constexpr size_t blob_size = sizeof ( blob ) - 1 ;
ASSERT_OK ( Put ( key1 , blob ) ) ;
ASSERT_OK ( Put ( key2 , blob ) ) ;
ASSERT_OK ( Flush ( ) ) ;
ASSERT_OK ( Flush ( ) ) ;
ASSERT_OK ( Put ( " key3 " , " 0000000000 " ) ) ;
constexpr size_t first_blob_file_expected_size =
BlobLogHeader : : kSize +
BlobLogRecord : : CalculateAdjustmentForRecordHeader ( key1_size ) + blob_size +
BlobLogRecord : : CalculateAdjustmentForRecordHeader ( key2_size ) + blob_size +
BlobLogFooter : : kSize ;
ASSERT_OK ( Put ( key3 , blob ) ) ;
ASSERT_OK ( Flush ( ) ) ;
ASSERT_OK ( Flush ( ) ) ;
// num of files
constexpr size_t second_blob_file_expected_size =
BlobLogHeader : : kSize +
BlobLogRecord : : CalculateAdjustmentForRecordHeader ( key3_size ) + blob_size +
BlobLogFooter : : kSize ;
constexpr size_t total_expected_size =
first_blob_file_expected_size + second_blob_file_expected_size ;
// Number of blob files
uint64_t num_blob_files = 0 ;
uint64_t num_blob_files = 0 ;
EXPECT_TRUE (
ASSER T_TRUE(
db_ - > GetIntProperty ( DB : : Properties : : kNumBlobFiles , & num_blob_files ) ) ;
db_ - > GetIntProperty ( DB : : Properties : : kNumBlobFiles , & num_blob_files ) ) ;
ASSERT_EQ ( num_blob_files , 2 ) ;
ASSERT_EQ ( num_blob_files , 2 ) ;
// size of live blob files
// Total size of live blob files
uint64_t live_blob_file_size = 0 ;
uint64_t live_blob_file_size = 0 ;
EXPECT_TRUE ( db_ - > GetIntProperty ( DB : : Properties : : kLiveBlobFileSize ,
ASSER T_TRUE( db_ - > GetIntProperty ( DB : : Properties : : kLiveBlobFileSize ,
& live_blob_file_size ) ) ;
& live_blob_file_size ) ) ;
// size of total blob files
ASSERT_EQ ( live_blob_file_size , total_expected_size ) ;
// Total size of all blob files across all versions
// Note: this should be the same as above since we only have one
// version at this point.
uint64_t total_blob_file_size = 0 ;
uint64_t total_blob_file_size = 0 ;
EXPECT_TRUE ( db_ - > GetIntProperty ( DB : : Properties : : kTotalBlobFileSize ,
ASSER T_TRUE( db_ - > GetIntProperty ( DB : : Properties : : kTotalBlobFileSize ,
& total_blob_file_size ) ) ;
& total_blob_file_size ) ) ;
ASSERT_EQ ( live_blob_file_size , total_blob_file_size ) ;
ASSERT_EQ ( total_blob_file_size , total_expected_size ) ;
auto * versions = dbfull ( ) - > TEST_GetVersionSet ( ) ;
auto * current = versions - > GetColumnFamilySet ( ) - > GetDefault ( ) - > current ( ) ;
const auto & blob_files = current - > storage_info ( ) - > GetBlobFiles ( ) ;
uint64_t expected_live_blob_file_size = 0 ;
for ( const auto & pair : blob_files ) {
expected_live_blob_file_size + = pair . second - > GetTotalBlobBytes ( ) ;
}
ASSERT_EQ ( live_blob_file_size , expected_live_blob_file_size ) ;
// estimate live data size
// Delete key2 to create some garbage
std : : string blob_stats = " " ;
ASSERT_OK ( Delete ( key2 ) ) ;
EXPECT_TRUE ( db_ - > GetProperty ( DB : : Properties : : kBlobStats , & blob_stats ) ) ;
EXPECT_TRUE ( blob_stats . size ( ) > 0 ) ;
// delete key2 to make some garbage
ASSERT_OK ( Delete ( " key2 " ) ) ;
ASSERT_OK ( Flush ( ) ) ;
ASSERT_OK ( Flush ( ) ) ;
constexpr Slice * begin = nullptr ;
constexpr Slice * begin = nullptr ;
constexpr Slice * end = nullptr ;
constexpr Slice * end = nullptr ;
ASSERT_OK ( db_ - > CompactRange ( CompactRangeOptions ( ) , begin , end ) ) ;
ASSERT_OK ( db_ - > CompactRange ( CompactRangeOptions ( ) , begin , end ) ) ;
std : : string new_blob_stats = " " ;
constexpr size_t expected_garbage_size =
EXPECT_TRUE ( db_ - > GetProperty ( DB : : Properties : : kBlobStats , & new_blob_stats ) ) ;
BlobLogRecord : : CalculateAdjustmentForRecordHeader ( key2_size ) + blob_size ;
std : : cout < < blob_stats < < new_blob_stats < < std : : endl ;
{
// Blob file stats
std : : istringstream ss1 ( blob_stats ) ;
std : : string blob_stats ;
std : : istringstream ss2 ( new_blob_stats ) ;
ASSERT_TRUE ( db_ - > GetProperty ( DB : : Properties : : kBlobStats , & blob_stats ) ) ;
std : : string stats_line = " " ;
std : : string new_stats_line = " " ;
std : : ostringstream oss ;
// skip the first line because it is the version info
oss < < " Number of blob files: 2 \n Total size of blob files: "
std : : getline ( ss1 , stats_line ) ;
< < total_expected_size
std : : getline ( ss2 , new_stats_line ) ;
< < " \n Total size of garbage in blob files: " < < expected_garbage_size
for ( size_t i = 0 ; i < 3 ; i + + ) {
< < ' \n ' ;
std : : getline ( ss1 , stats_line ) ;
std : : getline ( ss2 , new_stats_line ) ;
ASSERT_EQ ( blob_stats , oss . str ( ) ) ;
if ( i = = 2 ) {
ASSERT_TRUE ( stats_line ! = new_stats_line ) ;
} else {
ASSERT_EQ ( stats_line , new_stats_line ) ;
}
}
}
}
}
// Checks that kTotalBlobFileSize covers the blob files of every live version
// (here: the current one plus an older one pinned by an iterator) and counts
// a blob file shared between versions only once.
TEST_F(DBBlobBasicTest, PropertiesMultiVersion) {
  Options options = GetDefaultOptions();
  options.enable_blob_files = true;
  options.min_blob_size = 0;

  Reopen(options);

  constexpr char key1[] = "key1";
  constexpr char key2[] = "key2";
  constexpr char key3[] = "key3";

  // All keys must have the same length so that every blob file has the same
  // expected size (see the final assertion).
  constexpr size_t key_size = sizeof(key1) - 1;
  static_assert(sizeof(key2) - 1 == key_size, "unexpected size: key2");
  static_assert(sizeof(key3) - 1 == key_size, "unexpected size: key3");

  constexpr char blob[] = "0000000000";
  constexpr size_t blob_size = sizeof(blob) - 1;

  ASSERT_OK(Put(key1, blob));
  ASSERT_OK(Flush());

  ASSERT_OK(Put(key2, blob));
  ASSERT_OK(Flush());

  // Create an iterator to keep the current version alive. Ownership is held
  // by unique_ptr so the iterator is released even if an assertion below
  // returns early from the test.
  std::unique_ptr<Iterator> iter(db_->NewIterator(ReadOptions()));
  ASSERT_OK(iter->status());

  // Note: the Delete and subsequent compaction results in the first blob file
  // not making it to the final version. (It is still part of the previous
  // version kept alive by the iterator though.) On the other hand, the Put
  // results in a third blob file.
  ASSERT_OK(Delete(key1));
  ASSERT_OK(Put(key3, blob));
  ASSERT_OK(Flush());

  // Null bounds: compact the whole key range.
  constexpr Slice* begin = nullptr;
  constexpr Slice* end = nullptr;
  ASSERT_OK(db_->CompactRange(CompactRangeOptions(), begin, end));

  // Total size of all blob files across all versions: between the two versions,
  // we should have three blob files of the same size with one blob each.
  // The version kept alive by the iterator contains the first and the second
  // blob file, while the final version contains the second and the third blob
  // file. (The second blob file is thus shared by the two versions but should
  // be counted only once.)
  uint64_t total_blob_file_size = 0;
  ASSERT_TRUE(db_->GetIntProperty(DB::Properties::kTotalBlobFileSize,
                                  &total_blob_file_size));
  ASSERT_EQ(total_blob_file_size,
            3 * (BlobLogHeader::kSize +
                 BlobLogRecord::CalculateAdjustmentForRecordHeader(key_size) +
                 blob_size + BlobLogFooter::kSize));
}
# endif // !ROCKSDB_LITE
# endif // !ROCKSDB_LITE