2018-12-31 22:04:05 +03:00
|
|
|
//
|
2024-01-01 03:07:21 +03:00
|
|
|
// Copyright Aliaksei Levin (levlam@telegram.org), Arseny Smirnov (arseny30@gmail.com) 2014-2024
|
2018-12-31 22:04:05 +03:00
|
|
|
//
|
|
|
|
// Distributed under the Boost Software License, Version 1.0. (See accompanying
|
|
|
|
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
|
|
|
//
|
|
|
|
#include "td/telegram/HashtagHints.h"
|
|
|
|
|
2019-01-06 22:59:17 +03:00
|
|
|
#include "td/telegram/Global.h"
|
|
|
|
#include "td/telegram/TdDb.h"
|
|
|
|
|
2018-07-18 04:11:48 +03:00
|
|
|
#include "td/db/SqliteKeyValueAsync.h"
|
2018-12-31 22:04:05 +03:00
|
|
|
|
2022-11-23 19:37:32 +03:00
|
|
|
#include "td/utils/HashTableUtils.h"
|
2018-12-31 22:04:05 +03:00
|
|
|
#include "td/utils/logging.h"
|
|
|
|
#include "td/utils/tl_helpers.h"
|
2019-11-17 19:30:53 +03:00
|
|
|
#include "td/utils/utf8.h"
|
2018-12-31 22:04:05 +03:00
|
|
|
|
|
|
|
namespace td {
|
|
|
|
|
2024-06-02 01:11:32 +03:00
|
|
|
HashtagHints::HashtagHints(string mode, char first_character, ActorShared<> parent)
|
|
|
|
: mode_(std::move(mode)), first_character_(first_character), parent_(std::move(parent)) {
|
2018-12-31 22:04:05 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
void HashtagHints::start_up() {
|
2023-03-14 01:41:04 +03:00
|
|
|
if (G()->use_sqlite_pmc()) { // TODO hashtag hints should not depend on use_sqlite_pmc
|
2018-12-31 22:04:05 +03:00
|
|
|
G()->td_db()->get_sqlite_pmc()->get(get_key(),
|
|
|
|
PromiseCreator::lambda([actor_id = actor_id(this)](Result<string> res) {
|
|
|
|
send_closure(actor_id, &HashtagHints::from_db, std::move(res), false);
|
|
|
|
}));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void HashtagHints::hashtag_used(const string &hashtag) {
|
|
|
|
if (!sync_with_db_) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
hashtag_used_impl(hashtag);
|
|
|
|
G()->td_db()->get_sqlite_pmc()->set(get_key(), serialize(keys_to_strings(hints_.search_empty(101).second)),
|
2024-05-25 20:35:21 +03:00
|
|
|
Promise<Unit>());
|
2018-12-31 22:04:05 +03:00
|
|
|
}
|
|
|
|
|
2024-05-25 20:35:21 +03:00
|
|
|
void HashtagHints::remove_hashtag(string hashtag, Promise<Unit> promise) {
|
2018-12-31 22:04:05 +03:00
|
|
|
if (!sync_with_db_) {
|
2024-05-25 20:35:21 +03:00
|
|
|
return promise.set_value(Unit());
|
2018-12-31 22:04:05 +03:00
|
|
|
}
|
2024-06-02 01:11:32 +03:00
|
|
|
if (hashtag[0] == first_character_) {
|
2018-12-31 22:04:05 +03:00
|
|
|
hashtag = hashtag.substr(1);
|
|
|
|
}
|
2022-11-23 19:37:32 +03:00
|
|
|
auto key = Hash<string>()(hashtag);
|
2018-12-31 22:04:05 +03:00
|
|
|
if (hints_.has_key(key)) {
|
|
|
|
hints_.remove(key);
|
|
|
|
G()->td_db()->get_sqlite_pmc()->set(get_key(), serialize(keys_to_strings(hints_.search_empty(101).second)),
|
2024-05-25 20:35:21 +03:00
|
|
|
Promise<Unit>());
|
2018-12-31 22:04:05 +03:00
|
|
|
promise.set_value(Unit()); // set promise explicitly, because sqlite_pmc waits for too long before setting promise
|
|
|
|
} else {
|
|
|
|
promise.set_value(Unit());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-25 20:35:21 +03:00
|
|
|
void HashtagHints::clear(Promise<Unit> promise) {
|
2018-12-31 22:04:05 +03:00
|
|
|
if (!sync_with_db_) {
|
2024-05-25 20:35:21 +03:00
|
|
|
return promise.set_value(Unit());
|
|
|
|
}
|
|
|
|
hints_ = {};
|
|
|
|
G()->td_db()->get_sqlite_pmc()->set(get_key(), serialize(vector<string>()), Promise<Unit>());
|
|
|
|
promise.set_value(Unit());
|
|
|
|
}
|
|
|
|
|
|
|
|
void HashtagHints::query(const string &prefix, int32 limit, Promise<vector<string>> promise) {
|
|
|
|
if (!sync_with_db_) {
|
|
|
|
promise.set_value(vector<string>());
|
2018-12-31 22:04:05 +03:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2024-06-02 01:11:32 +03:00
|
|
|
auto query = Slice(prefix).substr(prefix[0] == first_character_ ? 1 : 0);
|
|
|
|
auto result = query.empty() ? hints_.search_empty(limit) : hints_.search(query, limit);
|
2018-12-31 22:04:05 +03:00
|
|
|
promise.set_value(keys_to_strings(result.second));
|
|
|
|
}
|
|
|
|
|
|
|
|
string HashtagHints::get_key() const {
|
|
|
|
return "hashtag_hints#" + mode_;
|
|
|
|
}
|
|
|
|
|
|
|
|
void HashtagHints::hashtag_used_impl(const string &hashtag) {
|
2019-11-17 19:30:53 +03:00
|
|
|
if (!check_utf8(hashtag)) {
|
|
|
|
LOG(ERROR) << "Trying to add invalid UTF-8 hashtag \"" << hashtag << '"';
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2022-11-23 19:37:32 +03:00
|
|
|
auto key = Hash<string>()(hashtag);
|
2018-12-31 22:04:05 +03:00
|
|
|
hints_.add(key, hashtag);
|
|
|
|
hints_.set_rating(key, -++counter_);
|
|
|
|
}
|
|
|
|
|
|
|
|
void HashtagHints::from_db(Result<string> data, bool dummy) {
|
2020-05-16 02:25:03 +03:00
|
|
|
if (G()->close_flag()) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2018-12-31 22:04:05 +03:00
|
|
|
sync_with_db_ = true;
|
|
|
|
if (data.is_error() || data.ok().empty()) {
|
|
|
|
return;
|
|
|
|
}
|
2024-05-25 20:35:21 +03:00
|
|
|
vector<string> hashtags;
|
2018-12-31 22:04:05 +03:00
|
|
|
auto status = unserialize(hashtags, data.ok());
|
|
|
|
if (status.is_error()) {
|
2019-11-17 19:30:53 +03:00
|
|
|
LOG(ERROR) << "Failed to unserialize hashtag hints: " << status;
|
2018-12-31 22:04:05 +03:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (auto it = hashtags.rbegin(); it != hashtags.rend(); ++it) {
|
|
|
|
hashtag_used_impl(*it);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-25 20:35:21 +03:00
|
|
|
vector<string> HashtagHints::keys_to_strings(const vector<int64> &keys) {
|
|
|
|
vector<string> result;
|
2018-12-31 22:04:05 +03:00
|
|
|
result.reserve(keys.size());
|
|
|
|
for (auto &it : keys) {
|
|
|
|
result.push_back(hints_.key_to_string(it));
|
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
2024-05-25 20:35:21 +03:00
|
|
|
|
2018-12-31 22:04:05 +03:00
|
|
|
} // namespace td
|