// // Copyright Aliaksei Levin (levlam@telegram.org), Arseny Smirnov (arseny30@gmail.com) 2014-2022 // // Distributed under the Boost Software License, Version 1.0. (See accompanying // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) // #include "td/db/TQueue.h" #include "td/db/binlog/Binlog.h" #include "td/db/binlog/BinlogEvent.h" #include "td/db/binlog/BinlogHelper.h" #include "td/db/binlog/BinlogInterface.h" #include "td/utils/FlatHashMap.h" #include "td/utils/misc.h" #include "td/utils/Random.h" #include "td/utils/StorerBase.h" #include "td/utils/tl_helpers.h" #include "td/utils/tl_parsers.h" #include "td/utils/tl_storers.h" #include namespace td { using EventId = TQueue::EventId; EventId::EventId() { } Result EventId::from_int32(int32 id) { if (!is_valid_id(id)) { return Status::Error("Invalid ID"); } return EventId(id); } bool EventId::is_valid() const { return !empty() && is_valid_id(id_); } int32 EventId::value() const { return id_; } Result EventId::next() const { return from_int32(id_ + 1); } Result EventId::advance(size_t offset) const { TRY_RESULT(new_id, narrow_cast_safe(id_ + offset)); return from_int32(new_id); } bool EventId::empty() const { return id_ == 0; } bool EventId::operator==(const EventId &other) const { return id_ == other.id_; } bool EventId::operator!=(const EventId &other) const { return !(*this == other); } bool EventId::operator<(const EventId &other) const { return id_ < other.id_; } StringBuilder &operator<<(StringBuilder &string_builder, EventId id) { return string_builder << "EventId{" << id.value() << "}"; } EventId::EventId(int32 id) : id_(id) { CHECK(is_valid_id(id)); } bool EventId::is_valid_id(int32 id) { return 0 <= id && id < MAX_ID; } class TQueueImpl final : public TQueue { static constexpr size_t MAX_EVENT_LENGTH = 65536 * 8; static constexpr size_t MAX_QUEUE_EVENTS = 1000000; static constexpr size_t MAX_TOTAL_EVENT_LENGTH = 1 << 30; public: void set_callback(unique_ptr callback) final { callback_ = std::move(callback); } unique_ptr extract_callback() final { return std::move(callback_); } bool do_push(QueueId queue_id, RawEvent &&raw_event) final { CHECK(raw_event.event_id.is_valid()); // raw_event.data can be empty when replaying binlog if (raw_event.data.size() > MAX_EVENT_LENGTH) { return false; } auto &q = queues_[queue_id]; if (q.events.size() >= MAX_QUEUE_EVENTS || q.total_event_length > MAX_TOTAL_EVENT_LENGTH - raw_event.data.size() || raw_event.expires_at <= 0) { return false; } auto event_id = raw_event.event_id; if (event_id < q.tail_id) { return false; } if (!q.events.empty()) { auto it = q.events.end(); --it; if (it->second.data.empty()) { if (callback_ != nullptr && it->second.log_event_id != 0) { callback_->pop(it->second.log_event_id); } q.events.erase(it); } } if (q.events.empty() && !raw_event.data.empty()) { schedule_queue_gc(queue_id, q, raw_event.expires_at); } if (raw_event.log_event_id == 0 && callback_ != nullptr) { raw_event.log_event_id = callback_->push(queue_id, raw_event); } q.tail_id = event_id.next().move_as_ok(); q.total_event_length += raw_event.data.size(); q.events.emplace(event_id, std::move(raw_event)); return true; } Result push(QueueId queue_id, string data, int32 expires_at, int64 extra, EventId hint_new_id) final { if (data.empty()) { return Status::Error("Data is empty"); } if (data.size() > MAX_EVENT_LENGTH) { return Status::Error("Data is too big"); } auto &q = queues_[queue_id]; if (q.events.size() >= MAX_QUEUE_EVENTS) { return Status::Error("Queue is full"); } if (q.total_event_length > MAX_TOTAL_EVENT_LENGTH - data.size()) { return Status::Error("Queue size is too big"); } if (expires_at <= 0) { return Status::Error("Failed to add already expired event"); } EventId event_id; while (true) { if (q.tail_id.empty()) { if (hint_new_id.empty()) { q.tail_id = EventId::from_int32(Random::fast(2 * MAX_QUEUE_EVENTS + 1, EventId::MAX_ID / 2)).move_as_ok(); } else { q.tail_id = hint_new_id; } } event_id = q.tail_id; CHECK(event_id.is_valid()); if (event_id.next().is_ok()) { break; } for (auto it = q.events.begin(); it != q.events.end();) { pop(q, queue_id, it, {}); } q.tail_id = EventId(); CHECK(hint_new_id.next().is_ok()); } RawEvent raw_event; raw_event.event_id = event_id; raw_event.data = std::move(data); raw_event.expires_at = expires_at; raw_event.extra = extra; bool is_added = do_push(queue_id, std::move(raw_event)); CHECK(is_added); return event_id; } EventId get_head(QueueId queue_id) const final { auto it = queues_.find(queue_id); if (it == queues_.end()) { return EventId(); } return get_queue_head(it->second); } EventId get_tail(QueueId queue_id) const final { auto it = queues_.find(queue_id); if (it == queues_.end()) { return EventId(); } auto &q = it->second; return q.tail_id; } void forget(QueueId queue_id, EventId event_id) final { auto q_it = queues_.find(queue_id); if (q_it == queues_.end()) { return; } auto &q = q_it->second; auto it = q.events.find(event_id); if (it == q.events.end()) { return; } pop(q, queue_id, it, q.tail_id); } Result get(QueueId queue_id, EventId from_id, bool forget_previous, int32 unix_time_now, MutableSpan &result_events) final { auto it = queues_.find(queue_id); if (it == queues_.end()) { result_events.truncate(0); return 0; } auto &q = it->second; // Some sanity checks if (from_id.value() > q.tail_id.value() + 10) { return Status::Error("Specified from_id is in the future"); } if (from_id.value() < get_queue_head(q).value() - static_cast(MAX_QUEUE_EVENTS)) { return Status::Error("Specified from_id is in the past"); } do_get(queue_id, q, from_id, forget_previous, unix_time_now, result_events); return get_size(q); } int64 run_gc(int32 unix_time_now) final { int64 deleted_events = 0; while (!queue_gc_at_.empty()) { auto it = queue_gc_at_.begin(); if (it->first >= unix_time_now) { break; } auto queue_id = it->second; auto &q = queues_[queue_id]; CHECK(q.gc_at == it->first); int32 new_gc_at = 0; if (!q.events.empty()) { auto head_id = q.events.begin()->first; Event event; MutableSpan span{&event, 1}; size_t size_before = get_size(q); do_get(queue_id, q, head_id, false, unix_time_now, span); size_t size_after = get_size(q); CHECK(size_after <= size_before); deleted_events += size_before - size_after; if (!span.empty()) { CHECK(!event.data.empty()); new_gc_at = event.expires_at; CHECK(new_gc_at >= unix_time_now); } } schedule_queue_gc(queue_id, q, new_gc_at); } return deleted_events; } size_t get_size(QueueId queue_id) const final { auto it = queues_.find(queue_id); if (it == queues_.end()) { return 0; } return get_size(it->second); } void close(Promise<> promise) final { if (callback_ != nullptr) { callback_->close(std::move(promise)); callback_ = nullptr; } } private: struct Queue { EventId tail_id; std::map events; size_t total_event_length = 0; int32 gc_at = 0; }; FlatHashMap queues_; std::set> queue_gc_at_; unique_ptr callback_; static EventId get_queue_head(const Queue &q) { if (q.events.empty()) { return q.tail_id; } return q.events.begin()->first; } static size_t get_size(const Queue &q) { if (q.events.empty()) { return 0; } return q.events.size() - (q.events.rbegin()->second.data.empty() ? 1 : 0); } void pop(Queue &q, QueueId queue_id, std::map::iterator &it, EventId tail_id) { auto &event = it->second; if (callback_ == nullptr || event.log_event_id == 0) { remove_event(q, it); return; } if (event.event_id.next().ok() == tail_id) { if (!event.data.empty()) { clear_event_data(q, event); callback_->push(queue_id, event); } ++it; } else { callback_->pop(event.log_event_id); remove_event(q, it); } } static void remove_event(Queue &q, std::map::iterator &it) { q.total_event_length -= it->second.data.size(); it = q.events.erase(it); } static void clear_event_data(Queue &q, RawEvent &event) { q.total_event_length -= event.data.size(); event.data = {}; } void do_get(QueueId queue_id, Queue &q, EventId from_id, bool forget_previous, int32 unix_time_now, MutableSpan &result_events) { if (forget_previous) { for (auto it = q.events.begin(); it != q.events.end() && it->first < from_id;) { pop(q, queue_id, it, q.tail_id); } } size_t ready_n = 0; for (auto it = q.events.lower_bound(from_id); it != q.events.end();) { auto &event = it->second; if (event.expires_at < unix_time_now || event.data.empty()) { pop(q, queue_id, it, q.tail_id); } else { CHECK(!(event.event_id < from_id)); if (ready_n == result_events.size()) { break; } auto &to = result_events[ready_n]; to.data = event.data; to.id = event.event_id; to.expires_at = event.expires_at; to.extra = event.extra; ready_n++; ++it; } } result_events.truncate(ready_n); } void schedule_queue_gc(QueueId queue_id, Queue &q, int32 gc_at) { if (q.gc_at != 0) { bool is_deleted = queue_gc_at_.erase({q.gc_at, queue_id}) > 0; CHECK(is_deleted); } q.gc_at = gc_at; if (q.gc_at != 0) { bool is_inserted = queue_gc_at_.emplace(gc_at, queue_id).second; CHECK(is_inserted); } } }; unique_ptr TQueue::create() { return make_unique(); } struct TQueueLogEvent final : public Storer { int64 queue_id; int32 event_id; int32 expires_at; Slice data; int64 extra; template void store(StorerT &&storer) const { using td::store; store(queue_id, storer); store(event_id, storer); store(expires_at, storer); store(data, storer); if (extra != 0) { store(extra, storer); } } template void parse(ParserT &&parser, int32 has_extra) { using td::parse; parse(queue_id, parser); parse(event_id, parser); parse(expires_at, parser); data = parser.template fetch_string(); if (has_extra == 0) { extra = 0; } else { parse(extra, parser); } } size_t size() const final { TlStorerCalcLength storer; store(storer); return storer.get_length(); } size_t store(uint8 *ptr) const final { TlStorerUnsafe storer(ptr); store(storer); return static_cast(storer.get_buf() - ptr); } }; template uint64 TQueueBinlog::push(QueueId queue_id, const RawEvent &event) { TQueueLogEvent log_event; log_event.queue_id = queue_id; log_event.event_id = event.event_id.value(); log_event.expires_at = event.expires_at; log_event.data = event.data; log_event.extra = event.extra; auto magic = BINLOG_EVENT_TYPE + (log_event.extra != 0); if (event.log_event_id == 0) { return binlog_->add(magic, log_event); } binlog_->rewrite(event.log_event_id, magic, log_event); return event.log_event_id; } template void TQueueBinlog::pop(uint64 log_event_id) { binlog_->erase(log_event_id); } template Status TQueueBinlog::replay(const BinlogEvent &binlog_event, TQueue &q) const { TQueueLogEvent event; TlParser parser(binlog_event.data_); int32 has_extra = binlog_event.type_ - BINLOG_EVENT_TYPE; if (has_extra != 0 && has_extra != 1) { return Status::Error("Wrong magic"); } event.parse(parser, has_extra); parser.fetch_end(); TRY_STATUS(parser.get_status()); TRY_RESULT(event_id, EventId::from_int32(event.event_id)); RawEvent raw_event; raw_event.log_event_id = binlog_event.id_; raw_event.event_id = event_id; raw_event.expires_at = event.expires_at; raw_event.data = event.data.str(); raw_event.extra = event.extra; if (!q.do_push(event.queue_id, std::move(raw_event))) { return Status::Error("Failed to add event"); } return Status::OK(); } template void TQueueBinlog::close(Promise<> promise) { binlog_->close(std::move(promise)); } template class TQueueBinlog; template class TQueueBinlog; uint64 TQueueMemoryStorage::push(QueueId queue_id, const RawEvent &event) { auto log_event_id = event.log_event_id == 0 ? next_log_event_id_++ : event.log_event_id; events_[log_event_id] = std::make_pair(queue_id, event); return log_event_id; } void TQueueMemoryStorage::pop(uint64 log_event_id) { events_.erase(log_event_id); } void TQueueMemoryStorage::replay(TQueue &q) const { for (auto &e : events_) { auto x = e.second; x.second.log_event_id = e.first; bool is_added = q.do_push(x.first, std::move(x.second)); CHECK(is_added); } } void TQueueMemoryStorage::close(Promise<> promise) { events_.clear(); promise.set_value({}); } } // namespace td