mirror of
https://github.com/facebook/rocksdb.git
synced 2024-11-30 04:41:49 +00:00
e8cb32ed67
Summary: The patch adds blob file support to the `Get` API by extending `Version` so that whenever a blob reference is read from a file, the blob is retrieved from the corresponding blob file and passed back to the caller. (This is assuming the blob reference is valid and the blob file is actually part of the given `Version`.) It also introduces a cache of `BlobFileReader`s called `BlobFileCache` that enables sharing `BlobFileReader`s between callers. `BlobFileCache` uses the same backing cache as `TableCache`, so `max_open_files` (if specified) limits the total number of open (table + blob) files. TODO: proactively open/cache blob files and pin the cache handles of the readers in the metadata objects similarly to what `VersionBuilder::LoadTableHandlers` does for table files. Pull Request resolved: https://github.com/facebook/rocksdb/pull/7540 Test Plan: `make check` Reviewed By: riversand963 Differential Revision: D24260219 Pulled By: ltamasi fbshipit-source-id: a8a2a4f11d3d04d6082201b52184bc4d7b0857ba
133 lines
3.9 KiB
C++
133 lines
3.9 KiB
C++
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
|
// This source code is licensed under both the GPLv2 (found in the
|
|
// COPYING file in the root directory) and Apache 2.0 License
|
|
// (found in the LICENSE.Apache file in the root directory).
|
|
//
|
|
|
|
#include "db/blob/blob_log_sequential_reader.h"
|
|
|
|
#include "file/random_access_file_reader.h"
|
|
#include "monitoring/statistics.h"
|
|
#include "util/stop_watch.h"
|
|
|
|
namespace ROCKSDB_NAMESPACE {
|
|
|
|
BlobLogSequentialReader::BlobLogSequentialReader(
|
|
std::unique_ptr<RandomAccessFileReader>&& file_reader, Env* env,
|
|
Statistics* statistics)
|
|
: file_(std::move(file_reader)),
|
|
env_(env),
|
|
statistics_(statistics),
|
|
next_byte_(0) {}
|
|
|
|
// Defaulted destructor: no work beyond destroying the members.
// NOTE(review): presumably defined here rather than in the header so that
// RandomAccessFileReader only has to be a complete type in this translation
// unit -- confirm against the class declaration.
BlobLogSequentialReader::~BlobLogSequentialReader() = default;
|
|
|
|
// Reads `size` bytes starting at the current read position into `buf` and
// points `*slice` at the result.
//
// The read position is advanced by `size` whether or not the read succeeds.
// Returns the error from the underlying file read if it fails, or
// Status::Corruption if fewer than `size` bytes were returned.
Status BlobLogSequentialReader::ReadSlice(uint64_t size, Slice* slice,
                                          char* buf) {
  assert(slice);
  assert(file_);

  // Stays alive until the function returns, so the whole call is timed.
  StopWatch read_sw(env_, statistics_, BLOB_DB_BLOB_FILE_READ_MICROS);

  const uint64_t start_offset = next_byte_;
  Status status = file_->Read(IOOptions(), start_offset,
                              static_cast<size_t>(size), slice, buf, nullptr);

  // Advance unconditionally, even if the read failed or came up short.
  next_byte_ = start_offset + size;

  if (status.ok()) {
    RecordTick(statistics_, BLOB_DB_BLOB_FILE_BYTES_READ, slice->size());

    // A short read means the file ended before the requested range did.
    if (slice->size() != size) {
      status = Status::Corruption("EOF reached while reading record");
    }
  }

  return status;
}
|
|
|
|
// Reads the blob file header and decodes it into `*header`.
//
// Must be the first read performed on this reader (asserted: the read
// position has to be 0). Returns the read error, a Corruption status on a
// short read, or otherwise whatever BlobLogHeader::DecodeFrom() returns.
Status BlobLogSequentialReader::ReadHeader(BlobLogHeader* header) {
  assert(header);
  assert(next_byte_ == 0);

  static_assert(BlobLogHeader::kSize <= sizeof(header_buf_),
                "Buffer is smaller than BlobLogHeader::kSize");

  Status status = ReadSlice(BlobLogHeader::kSize, &buffer_, header_buf_);

  if (status.ok()) {
    // ReadSlice() already reports short reads as corruption; this size check
    // is a defensive second line.
    if (buffer_.size() == BlobLogHeader::kSize) {
      status = header->DecodeFrom(buffer_);
    } else {
      status = Status::Corruption("EOF reached before file header");
    }
  }

  return status;
}
|
|
|
|
// Reads the next record at the current read position into `*record`.
//
// The record header is always read and decoded. `level` selects how much of
// the payload that follows is actually read:
//   kReadHeader        - key and value are skipped.
//   kReadHeaderKey     - the key is read into record->key_buf; the value is
//                        skipped.
//   kReadHeaderKeyBlob - key and value are read into record->key_buf and
//                        record->value_buf, then record->CheckBlobCRC() is
//                        run.
//
// If `blob_offset` is non-null, it receives the file offset just past the
// record's key, i.e. where the value starts.
//
// Returns the first error encountered, or OK.
Status BlobLogSequentialReader::ReadRecord(BlobLogRecord* record,
                                           ReadLevel level,
                                           uint64_t* blob_offset) {
  assert(record);
  static_assert(BlobLogRecord::kHeaderSize <= sizeof(header_buf_),
                "Buffer is smaller than BlobLogRecord::kHeaderSize");

  Status status =
      ReadSlice(BlobLogRecord::kHeaderSize, &buffer_, header_buf_);
  if (!status.ok()) {
    return status;
  }
  if (buffer_.size() != BlobLogRecord::kHeaderSize) {
    return Status::Corruption("EOF reached before record header");
  }

  status = record->DecodeHeaderFrom(buffer_);
  if (!status.ok()) {
    return status;
  }

  const uint64_t payload_size = record->key_size + record->value_size;

  // The read position now sits right after the record header, so the value
  // begins key_size bytes further on.
  if (blob_offset != nullptr) {
    *blob_offset = next_byte_ + record->key_size;
  }

  if (level == kReadHeader) {
    // Nothing to read: step over key and value in one go.
    next_byte_ += payload_size;
  } else if (level == kReadHeaderKey || level == kReadHeaderKeyBlob) {
    // Both remaining levels need the key.
    record->key_buf.reset(new char[record->key_size]);
    status =
        ReadSlice(record->key_size, &record->key, record->key_buf.get());

    if (level == kReadHeaderKey) {
      // Step over the value regardless of how the key read went.
      next_byte_ += record->value_size;
    } else {
      if (status.ok()) {
        record->value_buf.reset(new char[record->value_size]);
        status = ReadSlice(record->value_size, &record->value,
                           record->value_buf.get());
      }
      if (status.ok()) {
        status = record->CheckBlobCRC();
      }
    }
  }

  return status;
}
|
|
|
|
// Reads the blob file footer at the current read position and decodes it
// into `*footer`.
//
// Returns the read error, a Corruption status on a short read, or otherwise
// whatever BlobLogFooter::DecodeFrom() returns.
Status BlobLogSequentialReader::ReadFooter(BlobLogFooter* footer) {
  assert(footer);
  static_assert(BlobLogFooter::kSize <= sizeof(header_buf_),
                "Buffer is smaller than BlobLogFooter::kSize");

  Status status = ReadSlice(BlobLogFooter::kSize, &buffer_, header_buf_);

  if (status.ok()) {
    // ReadSlice() already reports short reads as corruption; this size check
    // is a defensive second line.
    if (buffer_.size() == BlobLogFooter::kSize) {
      status = footer->DecodeFrom(buffer_);
    } else {
      status = Status::Corruption("EOF reached before file footer");
    }
  }

  return status;
}
|
|
|
|
} // namespace ROCKSDB_NAMESPACE
|