2013-10-16 23:59:46 +02:00
|
|
|
// Copyright (c) 2013, Facebook, Inc. All rights reserved.
|
|
|
|
// This source code is licensed under the BSD-style license found in the
|
|
|
|
// LICENSE file in the root directory of this source tree. An additional grant
|
|
|
|
// of patent rights can be found in the PATENTS file in the same directory.
|
|
|
|
//
|
2013-08-06 21:54:37 +02:00
|
|
|
#include "db/transaction_log_impl.h"
|
2012-11-30 02:28:37 +01:00
|
|
|
#include "db/write_batch_internal.h"
|
2013-03-21 23:12:35 +01:00
|
|
|
|
2013-10-04 06:49:15 +02:00
|
|
|
namespace rocksdb {
|
2012-11-30 02:28:37 +01:00
|
|
|
|
|
|
|
// Constructs an iterator over the log files in `files`.
//
// The arguments are stored as-is (ownership of `files` is taken), the log
// reporter is pointed at the Env and info log found in `options`, and the
// iterator immediately tries to seek to sequence number `seq`.
//
// `files` and `dbimpl` must be non-null (asserted). `options` is dereferenced
// unconditionally, so it must be non-null as well.
TransactionLogIteratorImpl::TransactionLogIteratorImpl(
    const std::string& dir,
    const Options* options,
    const EnvOptions& soptions,
    const SequenceNumber seq,
    std::unique_ptr<VectorLogPtr> files,
    DBImpl const * const dbimpl)
    : dir_(dir),
      options_(options),
      soptions_(soptions),
      startingSequenceNumber_(seq),
      files_(std::move(files)),
      started_(false),
      isValid_(false),
      currentFileIndex_(0),
      currentBatchSeq_(0),
      currentLastSeq_(0),
      dbimpl_(dbimpl) {
  // Preconditions on the pointers this object keeps for its whole lifetime.
  assert(files_ != nullptr);
  assert(dbimpl_ != nullptr);

  // Corruption / info messages raised while reading go through the reporter.
  reporter_.env = options_->env;
  reporter_.info_log = options_->info_log.get();

  // Position the iterator at the requested starting sequence right away.
  SeekToStartSequence();
}
|
|
|
|
|
2013-01-20 11:07:13 +01:00
|
|
|
// Opens `logFile` for sequential reading and stores the handle in `*file`.
//
// A file that is not marked as archived is first looked up under its live
// name in `dir_`; if that fails, the archived name is tried because the file
// could have been moved to the archive in the meantime. A file already marked
// as archived is opened from the archive directly.
//
// Returns the status of the last open attempt.
Status TransactionLogIteratorImpl::OpenLogFile(
    const LogFile* logFile,
    unique_ptr<SequentialFile>* file) {
  Env* env = options_->env;

  if (logFile->Type() != kArchivedLogFile) {
    Status liveStatus = env->NewSequentialFile(
        LogFileName(dir_, logFile->LogNumber()), file, soptions_);
    if (liveStatus.ok()) {
      return liveStatus;
    }
    // Could not open the file in the DB directory; fall through and try the
    // archive dir instead.
  }

  return env->NewSequentialFile(
      ArchivedLogFileName(dir_, logFile->LogNumber()), file, soptions_);
}
|
|
|
|
|
2013-03-04 19:44:04 +01:00
|
|
|
// Hands the current batch to the caller.
//
// The returned BatchResult carries the batch's starting sequence number and
// takes ownership of the WriteBatch, so `currentBatch_` is left empty after
// this call. Must only be called while the iterator is in a valid state
// (asserted).
BatchResult TransactionLogIteratorImpl::GetBatch() {
  assert(isValid_);  // cannot call in a non valid state.

  BatchResult out;
  out.writeBatchPtr = std::move(currentBatch_);
  out.sequence = currentBatchSeq_;
  return out;
}
|
|
|
|
|
|
|
|
// Returns a copy of the status recorded by the most recent seek / read step.
Status TransactionLogIteratorImpl::status() {
  return currentStatus_;
}
|
|
|
|
|
|
|
|
bool TransactionLogIteratorImpl::Valid() {
|
|
|
|
return started_ && isValid_;
|
|
|
|
}
|
|
|
|
|
2013-10-21 04:06:19 +02:00
|
|
|
// Reads the next record from the current log reader into `record`, using
// `scratch` as backing storage, but only while the iterator is still behind
// the DB's latest sequence number.
//
// Returns false without touching the reader when the last sequence number
// already consumed has reached the latest one reported by the DB (there are no
// more complete entries to read); otherwise returns whatever ReadRecord
// returns.
bool TransactionLogIteratorImpl::RestrictedRead(
    Slice* record,
    std::string* scratch) {
  const bool caughtUp =
      currentLastSeq_ >= dbimpl_->GetLatestSequenceNumber();
  return !caughtUp && currentLogReader_->ReadRecord(record, scratch);
}
|
|
|
|
|
|
|
|
void TransactionLogIteratorImpl::SeekToStartSequence(
|
|
|
|
uint64_t startFileIndex,
|
|
|
|
bool strict) {
|
|
|
|
std::string scratch;
|
|
|
|
Slice record;
|
|
|
|
started_ = false;
|
|
|
|
isValid_ = false;
|
|
|
|
if (files_->size() <= startFileIndex) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
Status s = OpenLogReader(files_->at(startFileIndex).get());
|
|
|
|
if (!s.ok()) {
|
|
|
|
currentStatus_ = s;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
while (RestrictedRead(&record, &scratch)) {
|
|
|
|
if (record.size() < 12) {
|
|
|
|
reporter_.Corruption(
|
|
|
|
record.size(), Status::Corruption("very small log record"));
|
|
|
|
continue;
|
2012-11-30 02:28:37 +01:00
|
|
|
}
|
2013-10-21 04:06:19 +02:00
|
|
|
UpdateCurrentWriteBatch(record);
|
2013-10-25 04:09:02 +02:00
|
|
|
if (currentLastSeq_ >= startingSequenceNumber_) {
|
2013-10-21 04:06:19 +02:00
|
|
|
if (strict && currentBatchSeq_ != startingSequenceNumber_) {
|
|
|
|
currentStatus_ = Status::Corruption("Gap in sequence number. Could not "
|
|
|
|
"seek to required sequence number");
|
|
|
|
reporter_.Info(currentStatus_.ToString().c_str());
|
2013-10-14 00:28:24 +02:00
|
|
|
return;
|
2013-10-21 04:06:19 +02:00
|
|
|
} else if (strict) {
|
|
|
|
reporter_.Info("Could seek required sequence number. Iterator will "
|
|
|
|
"continue.");
|
2012-11-30 02:28:37 +01:00
|
|
|
}
|
2013-10-21 04:06:19 +02:00
|
|
|
isValid_ = true;
|
|
|
|
started_ = true; // set started_ as we could seek till starting sequence
|
|
|
|
return;
|
|
|
|
} else {
|
|
|
|
isValid_ = false;
|
2012-11-30 02:28:37 +01:00
|
|
|
}
|
2013-10-21 04:06:19 +02:00
|
|
|
}
|
2013-10-25 04:09:02 +02:00
|
|
|
|
2013-10-21 04:06:19 +02:00
|
|
|
// Could not find start sequence in first file. Normally this must be the
|
|
|
|
// only file. Otherwise log the error and let the iterator return next entry
|
2013-10-25 04:09:02 +02:00
|
|
|
// If strict is set, we want to seek exactly till the start sequence and it
|
|
|
|
// should have been present in the file we scanned above
|
|
|
|
if (strict) {
|
|
|
|
currentStatus_ = Status::Corruption("Gap in sequence number. Could not "
|
|
|
|
"seek to required sequence number");
|
|
|
|
reporter_.Info(currentStatus_.ToString().c_str());
|
|
|
|
} else if (files_->size() != 1) {
|
2013-10-21 04:06:19 +02:00
|
|
|
currentStatus_ = Status::Corruption("Start sequence was not found, "
|
|
|
|
"skipping to the next available");
|
2013-10-25 04:09:02 +02:00
|
|
|
reporter_.Info(currentStatus_.ToString().c_str());
|
|
|
|
// Let NextImpl find the next available entry. started_ remains false
|
|
|
|
// because we don't want to check for gaps while moving to start sequence
|
|
|
|
NextImpl(true);
|
2013-10-21 04:06:19 +02:00
|
|
|
}
|
2013-10-14 00:28:24 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
void TransactionLogIteratorImpl::Next() {
|
2013-10-25 04:09:02 +02:00
|
|
|
return NextImpl(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
void TransactionLogIteratorImpl::NextImpl(bool internal) {
|
2013-10-14 00:28:24 +02:00
|
|
|
std::string scratch;
|
|
|
|
Slice record;
|
|
|
|
isValid_ = false;
|
2013-10-25 04:09:02 +02:00
|
|
|
if (!internal && !started_) {
|
|
|
|
// Runs every time until we can seek to the start sequence
|
2013-10-14 00:28:24 +02:00
|
|
|
return SeekToStartSequence();
|
2013-04-09 01:28:09 +02:00
|
|
|
}
|
2013-10-14 00:28:24 +02:00
|
|
|
while(true) {
|
2013-01-20 11:07:13 +01:00
|
|
|
assert(currentLogReader_);
|
2013-10-25 04:09:02 +02:00
|
|
|
if (currentLogReader_->IsEOF()) {
|
|
|
|
currentLogReader_->UnmarkEOF();
|
|
|
|
}
|
|
|
|
while (RestrictedRead(&record, &scratch)) {
|
|
|
|
if (record.size() < 12) {
|
|
|
|
reporter_.Corruption(
|
|
|
|
record.size(), Status::Corruption("very small log record"));
|
|
|
|
continue;
|
|
|
|
} else {
|
|
|
|
// started_ should be true if called by application
|
|
|
|
assert(internal || started_);
|
|
|
|
// started_ should be false if called internally
|
|
|
|
assert(!internal || !started_);
|
|
|
|
UpdateCurrentWriteBatch(record);
|
|
|
|
if (internal && !started_) {
|
|
|
|
started_ = true;
|
2013-03-21 23:12:35 +01:00
|
|
|
}
|
2013-10-25 04:09:02 +02:00
|
|
|
return;
|
2012-11-30 02:28:37 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-10-14 00:28:24 +02:00
|
|
|
// Open the next file
|
|
|
|
if (currentFileIndex_ < files_->size() - 1) {
|
|
|
|
++currentFileIndex_;
|
|
|
|
Status status =OpenLogReader(files_->at(currentFileIndex_).get());
|
|
|
|
if (!status.ok()) {
|
2012-11-30 02:28:37 +01:00
|
|
|
isValid_ = false;
|
2013-10-14 00:28:24 +02:00
|
|
|
currentStatus_ = status;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
isValid_ = false;
|
2013-10-25 04:09:02 +02:00
|
|
|
if (currentLastSeq_ == dbimpl_->GetLatestSequenceNumber()) {
|
2013-10-14 00:28:24 +02:00
|
|
|
currentStatus_ = Status::OK();
|
|
|
|
} else {
|
2014-02-12 20:42:54 +01:00
|
|
|
currentStatus_ = Status::Corruption("NO MORE DATA LEFT");
|
2012-11-30 02:28:37 +01:00
|
|
|
}
|
2013-10-14 00:28:24 +02:00
|
|
|
return;
|
2012-11-30 02:28:37 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-10-25 04:09:02 +02:00
|
|
|
bool TransactionLogIteratorImpl::IsBatchExpected(
|
2013-10-21 04:06:19 +02:00
|
|
|
const WriteBatch* batch,
|
|
|
|
const SequenceNumber expectedSeq) {
|
|
|
|
assert(batch);
|
|
|
|
SequenceNumber batchSeq = WriteBatchInternal::Sequence(batch);
|
2013-10-25 04:09:02 +02:00
|
|
|
if (batchSeq != expectedSeq) {
|
2013-10-21 04:06:19 +02:00
|
|
|
char buf[200];
|
|
|
|
snprintf(buf, sizeof(buf),
|
2013-11-13 06:02:03 +01:00
|
|
|
"Discontinuity in log records. Got seq=%lu, Expected seq=%lu, "
|
|
|
|
"Last flushed seq=%lu.Log iterator will reseek the correct "
|
2013-11-13 05:05:28 +01:00
|
|
|
"batch.",
|
2013-11-13 06:02:03 +01:00
|
|
|
(unsigned long)batchSeq,
|
|
|
|
(unsigned long)expectedSeq,
|
|
|
|
(unsigned long)dbimpl_->GetLatestSequenceNumber());
|
2013-10-21 04:06:19 +02:00
|
|
|
reporter_.Info(buf);
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
2013-03-04 19:44:04 +01:00
|
|
|
void TransactionLogIteratorImpl::UpdateCurrentWriteBatch(const Slice& record) {
|
2013-11-08 00:46:48 +01:00
|
|
|
std::unique_ptr<WriteBatch> batch(new WriteBatch());
|
|
|
|
WriteBatchInternal::SetContents(batch.get(), record);
|
2013-10-21 04:06:19 +02:00
|
|
|
|
2013-10-25 04:09:02 +02:00
|
|
|
SequenceNumber expectedSeq = currentLastSeq_ + 1;
|
|
|
|
// If the iterator has started, then confirm that we get continuous batches
|
2013-11-08 00:46:48 +01:00
|
|
|
if (started_ && !IsBatchExpected(batch.get(), expectedSeq)) {
|
2013-10-21 04:06:19 +02:00
|
|
|
// Seek to the batch having expected sequence number
|
|
|
|
if (expectedSeq < files_->at(currentFileIndex_)->StartSequence()) {
|
|
|
|
// Expected batch must lie in the previous log file
|
2013-11-13 05:05:28 +01:00
|
|
|
// Avoid underflow.
|
|
|
|
if (currentFileIndex_ != 0) {
|
|
|
|
currentFileIndex_--;
|
|
|
|
}
|
2013-10-21 04:06:19 +02:00
|
|
|
}
|
|
|
|
startingSequenceNumber_ = expectedSeq;
|
2013-10-25 04:09:02 +02:00
|
|
|
// currentStatus_ will be set to Ok if reseek succeeds
|
|
|
|
currentStatus_ = Status::NotFound("Gap in sequence numbers");
|
2013-10-21 04:06:19 +02:00
|
|
|
return SeekToStartSequence(currentFileIndex_, true);
|
|
|
|
}
|
|
|
|
|
2013-11-08 00:46:48 +01:00
|
|
|
currentBatchSeq_ = WriteBatchInternal::Sequence(batch.get());
|
|
|
|
currentLastSeq_ = currentBatchSeq_ +
|
|
|
|
WriteBatchInternal::Count(batch.get()) - 1;
|
2013-10-21 04:06:19 +02:00
|
|
|
// currentBatchSeq_ can only change here
|
2013-10-25 04:09:02 +02:00
|
|
|
assert(currentLastSeq_ <= dbimpl_->GetLatestSequenceNumber());
|
2013-10-21 04:06:19 +02:00
|
|
|
|
2013-11-08 00:46:48 +01:00
|
|
|
currentBatch_ = move(batch);
|
2013-03-21 23:12:35 +01:00
|
|
|
isValid_ = true;
|
2013-03-21 23:49:20 +01:00
|
|
|
currentStatus_ = Status::OK();
|
2013-03-04 19:44:04 +01:00
|
|
|
}
|
|
|
|
|
2013-08-06 21:54:37 +02:00
|
|
|
// Opens `logFile` and replaces the current log reader with one reading from
// it. Messages from the new reader are routed to reporter_.
//
// Returns the failure from OpenLogFile unchanged if the file cannot be
// opened (the current reader is left untouched in that case); otherwise
// returns OK.
Status TransactionLogIteratorImpl::OpenLogReader(const LogFile* logFile) {
  unique_ptr<SequentialFile> file;
  Status opened = OpenLogFile(logFile, &file);
  if (opened.ok()) {
    assert(file);
    // NOTE(review): the trailing `true, 0` are presumably "verify checksums"
    // and "initial offset" -- confirm against log::Reader's constructor.
    currentLogReader_.reset(
        new log::Reader(std::move(file), &reporter_, true, 0));
    return Status::OK();
  }
  return opened;
}
|
2013-10-04 06:49:15 +02:00
|
|
|
} // namespace rocksdb
|