2016-02-09 15:12:00 -08:00
|
|
|
// Copyright (c) 2011-present, Facebook, Inc. All rights reserved.
|
2017-07-15 16:03:42 -07:00
|
|
|
// This source code is licensed under both the GPLv2 (found in the
|
|
|
|
// COPYING file in the root directory) and Apache 2.0 License
|
|
|
|
// (found in the LICENSE.Apache file in the root directory).
|
2013-10-16 14:59:46 -07:00
|
|
|
//
|
2011-03-18 22:37:00 +00:00
|
|
|
// Copyright (c) 2011 The LevelDB Authors. All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
|
|
// found in the LICENSE file. See the AUTHORS file for names of contributors.
|
|
|
|
|
|
|
|
#include "db/log_writer.h"
|
|
|
|
|
|
|
|
#include <stdint.h>
|
2019-09-16 10:31:27 -07:00
|
|
|
#include "file/writable_file_writer.h"
|
2013-08-23 08:38:13 -07:00
|
|
|
#include "rocksdb/env.h"
|
2011-03-18 22:37:00 +00:00
|
|
|
#include "util/coding.h"
|
|
|
|
#include "util/crc32c.h"
|
|
|
|
|
2020-02-20 12:07:53 -08:00
|
|
|
namespace ROCKSDB_NAMESPACE {
|
2011-03-18 22:37:00 +00:00
|
|
|
namespace log {
|
|
|
|
|
2019-03-27 10:18:56 -07:00
|
|
|
Writer::Writer(std::unique_ptr<WritableFileWriter>&& dest, uint64_t log_number,
|
2017-06-24 14:06:43 -07:00
|
|
|
bool recycle_log_files, bool manual_flush)
|
2015-10-08 13:07:15 -04:00
|
|
|
: dest_(std::move(dest)),
|
|
|
|
block_offset_(0),
|
|
|
|
log_number_(log_number),
|
2017-06-24 14:06:43 -07:00
|
|
|
recycle_log_files_(recycle_log_files),
|
|
|
|
manual_flush_(manual_flush) {
|
2011-03-18 22:37:00 +00:00
|
|
|
for (int i = 0; i <= kMaxRecordType; i++) {
|
|
|
|
char t = static_cast<char>(i);
|
|
|
|
type_crc_[i] = crc32c::Value(&t, 1);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-04-25 10:04:57 -07:00
|
|
|
Writer::~Writer() {
|
|
|
|
if (dest_) {
|
|
|
|
WriteBuffer();
|
|
|
|
}
|
|
|
|
}
|
2017-06-24 14:06:43 -07:00
|
|
|
|
|
|
|
Status Writer::WriteBuffer() { return dest_->Flush(); }
|
2011-03-18 22:37:00 +00:00
|
|
|
|
2019-04-25 10:04:57 -07:00
|
|
|
Status Writer::Close() {
|
|
|
|
Status s;
|
|
|
|
if (dest_) {
|
|
|
|
s = dest_->Close();
|
|
|
|
dest_.reset();
|
|
|
|
}
|
|
|
|
return s;
|
|
|
|
}
|
|
|
|
|
2011-03-18 22:37:00 +00:00
|
|
|
Status Writer::AddRecord(const Slice& slice) {
|
|
|
|
const char* ptr = slice.data();
|
|
|
|
size_t left = slice.size();
|
|
|
|
|
2015-10-19 17:24:05 -04:00
|
|
|
// Header size varies depending on whether we are recycling or not.
|
|
|
|
const int header_size =
|
|
|
|
recycle_log_files_ ? kRecyclableHeaderSize : kHeaderSize;
|
|
|
|
|
2011-03-18 22:37:00 +00:00
|
|
|
// Fragment the record if necessary and emit it. Note that if slice
|
|
|
|
// is empty, we still want to iterate once to emit a single
|
|
|
|
// zero-length record
|
|
|
|
Status s;
|
2011-05-21 02:17:43 +00:00
|
|
|
bool begin = true;
|
2011-03-18 22:37:00 +00:00
|
|
|
do {
|
2015-11-15 21:49:14 +03:00
|
|
|
const int64_t leftover = kBlockSize - block_offset_;
|
2011-03-18 22:37:00 +00:00
|
|
|
assert(leftover >= 0);
|
2015-10-19 17:24:05 -04:00
|
|
|
if (leftover < header_size) {
|
2011-03-18 22:37:00 +00:00
|
|
|
// Switch to a new block
|
|
|
|
if (leftover > 0) {
|
2015-10-19 17:24:05 -04:00
|
|
|
// Fill the trailer (literal below relies on kHeaderSize and
|
|
|
|
// kRecyclableHeaderSize being <= 11)
|
|
|
|
assert(header_size <= 11);
|
2018-04-19 14:00:52 -07:00
|
|
|
s = dest_->Append(Slice("\x00\x00\x00\x00\x00\x00\x00\x00\x00\x00",
|
|
|
|
static_cast<size_t>(leftover)));
|
|
|
|
if (!s.ok()) {
|
|
|
|
break;
|
|
|
|
}
|
2011-03-18 22:37:00 +00:00
|
|
|
}
|
|
|
|
block_offset_ = 0;
|
|
|
|
}
|
|
|
|
|
2015-10-19 17:24:05 -04:00
|
|
|
// Invariant: we never leave < header_size bytes in a block.
|
2015-11-15 21:49:14 +03:00
|
|
|
assert(static_cast<int64_t>(kBlockSize - block_offset_) >= header_size);
|
2011-03-18 22:37:00 +00:00
|
|
|
|
2015-10-19 17:24:05 -04:00
|
|
|
const size_t avail = kBlockSize - block_offset_ - header_size;
|
2011-03-18 22:37:00 +00:00
|
|
|
const size_t fragment_length = (left < avail) ? left : avail;
|
|
|
|
|
|
|
|
RecordType type;
|
|
|
|
const bool end = (left == fragment_length);
|
|
|
|
if (begin && end) {
|
2015-10-19 17:24:05 -04:00
|
|
|
type = recycle_log_files_ ? kRecyclableFullType : kFullType;
|
2011-03-18 22:37:00 +00:00
|
|
|
} else if (begin) {
|
2015-10-19 17:24:05 -04:00
|
|
|
type = recycle_log_files_ ? kRecyclableFirstType : kFirstType;
|
2011-03-18 22:37:00 +00:00
|
|
|
} else if (end) {
|
2015-10-19 17:24:05 -04:00
|
|
|
type = recycle_log_files_ ? kRecyclableLastType : kLastType;
|
2011-03-18 22:37:00 +00:00
|
|
|
} else {
|
2015-10-19 17:24:05 -04:00
|
|
|
type = recycle_log_files_ ? kRecyclableMiddleType : kMiddleType;
|
2011-03-18 22:37:00 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
s = EmitPhysicalRecord(type, ptr, fragment_length);
|
|
|
|
ptr += fragment_length;
|
|
|
|
left -= fragment_length;
|
2011-05-21 02:17:43 +00:00
|
|
|
begin = false;
|
2011-03-18 22:37:00 +00:00
|
|
|
} while (s.ok() && left > 0);
|
2019-05-21 12:17:15 -07:00
|
|
|
|
|
|
|
if (s.ok()) {
|
|
|
|
if (!manual_flush_) {
|
|
|
|
s = dest_->Flush();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2011-03-18 22:37:00 +00:00
|
|
|
return s;
|
|
|
|
}
|
|
|
|
|
2018-05-14 10:53:32 -07:00
|
|
|
bool Writer::TEST_BufferIsEmpty() { return dest_->TEST_BufferIsEmpty(); }
|
|
|
|
|
2011-03-18 22:37:00 +00:00
|
|
|
Status Writer::EmitPhysicalRecord(RecordType t, const char* ptr, size_t n) {
|
|
|
|
assert(n <= 0xffff); // Must fit in two bytes
|
2015-10-19 17:24:05 -04:00
|
|
|
|
|
|
|
size_t header_size;
|
|
|
|
char buf[kRecyclableHeaderSize];
|
2011-03-18 22:37:00 +00:00
|
|
|
|
|
|
|
// Format the header
|
|
|
|
buf[4] = static_cast<char>(n & 0xff);
|
|
|
|
buf[5] = static_cast<char>(n >> 8);
|
|
|
|
buf[6] = static_cast<char>(t);
|
|
|
|
|
2015-10-19 17:24:05 -04:00
|
|
|
uint32_t crc = type_crc_[t];
|
|
|
|
if (t < kRecyclableFullType) {
|
|
|
|
// Legacy record format
|
|
|
|
assert(block_offset_ + kHeaderSize + n <= kBlockSize);
|
|
|
|
header_size = kHeaderSize;
|
|
|
|
} else {
|
|
|
|
// Recyclable record format
|
|
|
|
assert(block_offset_ + kRecyclableHeaderSize + n <= kBlockSize);
|
|
|
|
header_size = kRecyclableHeaderSize;
|
|
|
|
|
|
|
|
// Only encode low 32-bits of the 64-bit log number. This means
|
|
|
|
// we will fail to detect an old record if we recycled a log from
|
|
|
|
// ~4 billion logs ago, but that is effectively impossible, and
|
|
|
|
// even if it were we'dbe far more likely to see a false positive
|
|
|
|
// on the 32-bit CRC.
|
|
|
|
EncodeFixed32(buf + 7, static_cast<uint32_t>(log_number_));
|
|
|
|
crc = crc32c::Extend(crc, buf + 7, 4);
|
|
|
|
}
|
|
|
|
|
2011-03-18 22:37:00 +00:00
|
|
|
// Compute the crc of the record type and the payload.
|
2015-10-19 17:24:05 -04:00
|
|
|
crc = crc32c::Extend(crc, ptr, n);
|
|
|
|
crc = crc32c::Mask(crc); // Adjust for storage
|
2011-03-18 22:37:00 +00:00
|
|
|
EncodeFixed32(buf, crc);
|
|
|
|
|
|
|
|
// Write the header and the payload
|
2015-10-19 17:24:05 -04:00
|
|
|
Status s = dest_->Append(Slice(buf, header_size));
|
2011-03-18 22:37:00 +00:00
|
|
|
if (s.ok()) {
|
|
|
|
s = dest_->Append(Slice(ptr, n));
|
|
|
|
}
|
2015-10-19 17:24:05 -04:00
|
|
|
block_offset_ += header_size + n;
|
2011-03-18 22:37:00 +00:00
|
|
|
return s;
|
|
|
|
}
|
|
|
|
|
2011-10-31 17:22:06 +00:00
|
|
|
} // namespace log
|
2020-02-20 12:07:53 -08:00
|
|
|
} // namespace ROCKSDB_NAMESPACE
|