369 lines
15 KiB
C++
369 lines
15 KiB
C++
//
|
|
// Copyright Aliaksei Levin (levlam@telegram.org), Arseny Smirnov (arseny30@gmail.com) 2014-2023
|
|
//
|
|
// Distributed under the Boost Software License, Version 1.0. (See accompanying
|
|
// file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt)
|
|
//
|
|
#include "td/telegram/VideoNotesManager.h"
|
|
|
|
#include "td/telegram/AuthManager.h"
|
|
#include "td/telegram/files/FileManager.h"
|
|
#include "td/telegram/Global.h"
|
|
#include "td/telegram/MessagesManager.h"
|
|
#include "td/telegram/OptionManager.h"
|
|
#include "td/telegram/PhotoFormat.h"
|
|
#include "td/telegram/secret_api.h"
|
|
#include "td/telegram/Td.h"
|
|
#include "td/telegram/td_api.h"
|
|
#include "td/telegram/telegram_api.h"
|
|
#include "td/telegram/UpdatesManager.h"
|
|
|
|
#include "td/actor/actor.h"
|
|
|
|
#include "td/utils/buffer.h"
|
|
#include "td/utils/logging.h"
|
|
#include "td/utils/misc.h"
|
|
#include "td/utils/Status.h"
|
|
|
|
namespace td {
|
|
|
|
VideoNotesManager::VideoNotesManager(Td *td, ActorShared<> parent) : td_(td), parent_(std::move(parent)) {
|
|
}
|
|
|
|
VideoNotesManager::~VideoNotesManager() {
|
|
Scheduler::instance()->destroy_on_scheduler(G()->get_gc_scheduler_id(), video_notes_);
|
|
}
|
|
|
|
void VideoNotesManager::tear_down() {
|
|
parent_.reset();
|
|
}
|
|
|
|
int32 VideoNotesManager::get_video_note_duration(FileId file_id) const {
|
|
auto video_note = get_video_note(file_id);
|
|
CHECK(video_note != nullptr);
|
|
return video_note->duration;
|
|
}
|
|
|
|
tl_object_ptr<td_api::videoNote> VideoNotesManager::get_video_note_object(FileId file_id) const {
|
|
if (!file_id.is_valid()) {
|
|
return nullptr;
|
|
}
|
|
|
|
auto video_note = get_video_note(file_id);
|
|
auto speech_recognition_result = video_note->transcription_info == nullptr
|
|
? nullptr
|
|
: video_note->transcription_info->get_speech_recognition_result_object();
|
|
return make_tl_object<td_api::videoNote>(
|
|
video_note->duration, video_note->waveform, video_note->dimensions.width,
|
|
get_minithumbnail_object(video_note->minithumbnail),
|
|
get_thumbnail_object(td_->file_manager_.get(), video_note->thumbnail, PhotoFormat::Jpeg),
|
|
std::move(speech_recognition_result), td_->file_manager_->get_file_object(file_id));
|
|
}
|
|
|
|
FileId VideoNotesManager::on_get_video_note(unique_ptr<VideoNote> new_video_note, bool replace) {
|
|
auto file_id = new_video_note->file_id;
|
|
CHECK(file_id.is_valid());
|
|
LOG(INFO) << "Receive video note " << file_id;
|
|
auto &v = video_notes_[file_id];
|
|
if (v == nullptr) {
|
|
v = std::move(new_video_note);
|
|
} else if (replace) {
|
|
CHECK(v->file_id == new_video_note->file_id);
|
|
if (v->duration != new_video_note->duration || v->dimensions != new_video_note->dimensions ||
|
|
v->waveform != new_video_note->waveform) {
|
|
LOG(DEBUG) << "Video note " << file_id << " info has changed";
|
|
v->duration = new_video_note->duration;
|
|
v->dimensions = new_video_note->dimensions;
|
|
v->waveform = std::move(new_video_note->waveform);
|
|
}
|
|
if (v->minithumbnail != new_video_note->minithumbnail) {
|
|
v->minithumbnail = std::move(new_video_note->minithumbnail);
|
|
}
|
|
if (v->thumbnail != new_video_note->thumbnail) {
|
|
if (!v->thumbnail.file_id.is_valid()) {
|
|
LOG(DEBUG) << "Video note " << file_id << " thumbnail has changed";
|
|
} else {
|
|
LOG(INFO) << "Video note " << file_id << " thumbnail has changed from " << v->thumbnail << " to "
|
|
<< new_video_note->thumbnail;
|
|
}
|
|
v->thumbnail = std::move(new_video_note->thumbnail);
|
|
}
|
|
if (TranscriptionInfo::update_from(v->transcription_info, std::move(new_video_note->transcription_info))) {
|
|
on_video_note_transcription_completed(file_id);
|
|
}
|
|
}
|
|
return file_id;
|
|
}
|
|
|
|
VideoNotesManager::VideoNote *VideoNotesManager::get_video_note(FileId file_id) {
|
|
return video_notes_.get_pointer(file_id);
|
|
}
|
|
|
|
const VideoNotesManager::VideoNote *VideoNotesManager::get_video_note(FileId file_id) const {
|
|
return video_notes_.get_pointer(file_id);
|
|
}
|
|
|
|
FileId VideoNotesManager::get_video_note_thumbnail_file_id(FileId file_id) const {
|
|
auto video_note = get_video_note(file_id);
|
|
CHECK(video_note != nullptr);
|
|
return video_note->thumbnail.file_id;
|
|
}
|
|
|
|
void VideoNotesManager::delete_video_note_thumbnail(FileId file_id) {
|
|
auto &video_note = video_notes_[file_id];
|
|
CHECK(video_note != nullptr);
|
|
video_note->thumbnail = PhotoSize();
|
|
}
|
|
|
|
FileId VideoNotesManager::dup_video_note(FileId new_id, FileId old_id) {
|
|
const VideoNote *old_video_note = get_video_note(old_id);
|
|
CHECK(old_video_note != nullptr);
|
|
auto &new_video_note = video_notes_[new_id];
|
|
CHECK(new_video_note == nullptr);
|
|
new_video_note = make_unique<VideoNote>();
|
|
new_video_note->file_id = new_id;
|
|
new_video_note->duration = old_video_note->duration;
|
|
new_video_note->dimensions = old_video_note->dimensions;
|
|
new_video_note->waveform = old_video_note->waveform;
|
|
new_video_note->minithumbnail = old_video_note->minithumbnail;
|
|
new_video_note->thumbnail = old_video_note->thumbnail;
|
|
new_video_note->thumbnail.file_id =
|
|
td_->file_manager_->dup_file_id(new_video_note->thumbnail.file_id, "dup_video_note");
|
|
new_video_note->transcription_info = TranscriptionInfo::copy_if_transcribed(old_video_note->transcription_info);
|
|
return new_id;
|
|
}
|
|
|
|
void VideoNotesManager::merge_video_notes(FileId new_id, FileId old_id) {
|
|
CHECK(old_id.is_valid() && new_id.is_valid());
|
|
CHECK(new_id != old_id);
|
|
|
|
LOG(INFO) << "Merge video notes " << new_id << " and " << old_id;
|
|
const VideoNote *old_ = get_video_note(old_id);
|
|
CHECK(old_ != nullptr);
|
|
|
|
const auto *new_ = get_video_note(new_id);
|
|
if (new_ == nullptr) {
|
|
dup_video_note(new_id, old_id);
|
|
} else {
|
|
if (old_->thumbnail != new_->thumbnail) {
|
|
// LOG_STATUS(td_->file_manager_->merge(new_->thumbnail.file_id, old_->thumbnail.file_id));
|
|
}
|
|
}
|
|
LOG_STATUS(td_->file_manager_->merge(new_id, old_id));
|
|
}
|
|
|
|
void VideoNotesManager::create_video_note(FileId file_id, string minithumbnail, PhotoSize thumbnail, int32 duration,
|
|
Dimensions dimensions, string waveform, bool replace) {
|
|
auto v = make_unique<VideoNote>();
|
|
v->file_id = file_id;
|
|
v->duration = max(duration, 0);
|
|
if (dimensions.width == dimensions.height && dimensions.width <= 640) {
|
|
v->dimensions = dimensions;
|
|
} else {
|
|
LOG(INFO) << "Receive wrong video note dimensions " << dimensions;
|
|
}
|
|
v->waveform = std::move(waveform);
|
|
if (!td_->auth_manager_->is_bot()) {
|
|
v->minithumbnail = std::move(minithumbnail);
|
|
}
|
|
v->thumbnail = std::move(thumbnail);
|
|
on_get_video_note(std::move(v), replace);
|
|
}
|
|
|
|
void VideoNotesManager::register_video_note(FileId video_note_file_id, FullMessageId full_message_id,
|
|
const char *source) {
|
|
if (full_message_id.get_message_id().is_scheduled() || !full_message_id.get_message_id().is_server() ||
|
|
td_->auth_manager_->is_bot()) {
|
|
return;
|
|
}
|
|
LOG(INFO) << "Register video note " << video_note_file_id << " from " << full_message_id << " from " << source;
|
|
bool is_inserted = video_note_messages_[video_note_file_id].insert(full_message_id).second;
|
|
LOG_CHECK(is_inserted) << source << ' ' << video_note_file_id << ' ' << full_message_id;
|
|
is_inserted = message_video_notes_.emplace(full_message_id, video_note_file_id).second;
|
|
CHECK(is_inserted);
|
|
}
|
|
|
|
void VideoNotesManager::unregister_video_note(FileId video_note_file_id, FullMessageId full_message_id,
|
|
const char *source) {
|
|
if (full_message_id.get_message_id().is_scheduled() || !full_message_id.get_message_id().is_server() ||
|
|
td_->auth_manager_->is_bot()) {
|
|
return;
|
|
}
|
|
LOG(INFO) << "Unregister video note " << video_note_file_id << " from " << full_message_id << " from " << source;
|
|
auto &message_ids = video_note_messages_[video_note_file_id];
|
|
auto is_deleted = message_ids.erase(full_message_id) > 0;
|
|
LOG_CHECK(is_deleted) << source << ' ' << video_note_file_id << ' ' << full_message_id;
|
|
if (message_ids.empty()) {
|
|
video_note_messages_.erase(video_note_file_id);
|
|
}
|
|
is_deleted = message_video_notes_.erase(full_message_id) > 0;
|
|
CHECK(is_deleted);
|
|
}
|
|
|
|
void VideoNotesManager::recognize_speech(FullMessageId full_message_id, Promise<Unit> &&promise) {
|
|
auto it = message_video_notes_.find(full_message_id);
|
|
CHECK(it != message_video_notes_.end());
|
|
|
|
auto file_id = it->second;
|
|
auto video_note = get_video_note(file_id);
|
|
CHECK(video_note != nullptr);
|
|
if (video_note->transcription_info == nullptr) {
|
|
video_note->transcription_info = make_unique<TranscriptionInfo>();
|
|
}
|
|
|
|
auto handler = [actor_id = actor_id(this),
|
|
file_id](Result<telegram_api::object_ptr<telegram_api::updateTranscribedAudio>> r_update) {
|
|
send_closure(actor_id, &VideoNotesManager::on_transcribed_audio_update, file_id, true, std::move(r_update));
|
|
};
|
|
if (video_note->transcription_info->recognize_speech(td_, full_message_id, std::move(promise), std::move(handler))) {
|
|
on_video_note_transcription_updated(file_id);
|
|
}
|
|
}
|
|
|
|
void VideoNotesManager::on_transcribed_audio_update(
|
|
FileId file_id, bool is_initial, Result<telegram_api::object_ptr<telegram_api::updateTranscribedAudio>> r_update) {
|
|
if (G()->close_flag()) {
|
|
return;
|
|
}
|
|
|
|
auto video_note = get_video_note(file_id);
|
|
CHECK(video_note != nullptr);
|
|
CHECK(video_note->transcription_info != nullptr);
|
|
|
|
if (r_update.is_error()) {
|
|
auto promises = video_note->transcription_info->on_failed_transcription(r_update.error().clone());
|
|
on_video_note_transcription_updated(file_id);
|
|
fail_promises(promises, r_update.move_as_error());
|
|
return;
|
|
}
|
|
auto update = r_update.move_as_ok();
|
|
auto transcription_id = update->transcription_id_;
|
|
if (!update->pending_) {
|
|
auto promises = video_note->transcription_info->on_final_transcription(std::move(update->text_), transcription_id);
|
|
on_video_note_transcription_completed(file_id);
|
|
set_promises(promises);
|
|
} else {
|
|
auto is_changed =
|
|
video_note->transcription_info->on_partial_transcription(std::move(update->text_), transcription_id);
|
|
if (is_changed) {
|
|
on_video_note_transcription_updated(file_id);
|
|
}
|
|
|
|
if (is_initial) {
|
|
td_->updates_manager_->subscribe_to_transcribed_audio_updates(
|
|
transcription_id, [actor_id = actor_id(this),
|
|
file_id](Result<telegram_api::object_ptr<telegram_api::updateTranscribedAudio>> r_update) {
|
|
send_closure(actor_id, &VideoNotesManager::on_transcribed_audio_update, file_id, false,
|
|
std::move(r_update));
|
|
});
|
|
}
|
|
}
|
|
}
|
|
|
|
void VideoNotesManager::on_video_note_transcription_updated(FileId file_id) {
|
|
auto it = video_note_messages_.find(file_id);
|
|
if (it != video_note_messages_.end()) {
|
|
for (const auto &full_message_id : it->second) {
|
|
td_->messages_manager_->on_external_update_message_content(full_message_id);
|
|
}
|
|
}
|
|
}
|
|
|
|
void VideoNotesManager::on_video_note_transcription_completed(FileId file_id) {
|
|
auto it = video_note_messages_.find(file_id);
|
|
if (it != video_note_messages_.end()) {
|
|
for (const auto &full_message_id : it->second) {
|
|
td_->messages_manager_->on_update_message_content(full_message_id);
|
|
}
|
|
}
|
|
}
|
|
|
|
void VideoNotesManager::rate_speech_recognition(FullMessageId full_message_id, bool is_good, Promise<Unit> &&promise) {
|
|
auto it = message_video_notes_.find(full_message_id);
|
|
CHECK(it != message_video_notes_.end());
|
|
|
|
auto file_id = it->second;
|
|
auto video_note = get_video_note(file_id);
|
|
CHECK(video_note != nullptr);
|
|
if (video_note->transcription_info == nullptr) {
|
|
return promise.set_value(Unit());
|
|
}
|
|
video_note->transcription_info->rate_speech_recognition(td_, full_message_id, is_good, std::move(promise));
|
|
}
|
|
|
|
SecretInputMedia VideoNotesManager::get_secret_input_media(FileId video_note_file_id,
|
|
tl_object_ptr<telegram_api::InputEncryptedFile> input_file,
|
|
BufferSlice thumbnail, int32 layer) const {
|
|
const VideoNote *video_note = get_video_note(video_note_file_id);
|
|
CHECK(video_note != nullptr);
|
|
auto file_view = td_->file_manager_->get_file_view(video_note_file_id);
|
|
if (!file_view.is_encrypted_secret() || file_view.encryption_key().empty()) {
|
|
return SecretInputMedia{};
|
|
}
|
|
if (file_view.has_remote_location()) {
|
|
input_file = file_view.main_remote_location().as_input_encrypted_file();
|
|
}
|
|
if (!input_file) {
|
|
return SecretInputMedia{};
|
|
}
|
|
if (video_note->thumbnail.file_id.is_valid() && thumbnail.empty()) {
|
|
return SecretInputMedia{};
|
|
}
|
|
vector<tl_object_ptr<secret_api::DocumentAttribute>> attributes;
|
|
attributes.push_back(make_tl_object<secret_api::documentAttributeVideo>(
|
|
secret_api::documentAttributeVideo::ROUND_MESSAGE_MASK, true, video_note->duration, video_note->dimensions.width,
|
|
video_note->dimensions.height));
|
|
|
|
return {std::move(input_file),
|
|
std::move(thumbnail),
|
|
video_note->thumbnail.dimensions,
|
|
"video/mp4",
|
|
file_view,
|
|
std::move(attributes),
|
|
string(),
|
|
layer};
|
|
}
|
|
|
|
tl_object_ptr<telegram_api::InputMedia> VideoNotesManager::get_input_media(
|
|
FileId file_id, tl_object_ptr<telegram_api::InputFile> input_file,
|
|
tl_object_ptr<telegram_api::InputFile> input_thumbnail) const {
|
|
auto file_view = td_->file_manager_->get_file_view(file_id);
|
|
if (file_view.is_encrypted()) {
|
|
return nullptr;
|
|
}
|
|
if (file_view.has_remote_location() && !file_view.main_remote_location().is_web() && input_file == nullptr) {
|
|
return make_tl_object<telegram_api::inputMediaDocument>(
|
|
0, false /*ignored*/, file_view.main_remote_location().as_input_document(), 0, string());
|
|
}
|
|
if (file_view.has_url()) {
|
|
return make_tl_object<telegram_api::inputMediaDocumentExternal>(0, false /*ignored*/, file_view.url(), 0);
|
|
}
|
|
|
|
if (input_file != nullptr) {
|
|
const VideoNote *video_note = get_video_note(file_id);
|
|
CHECK(video_note != nullptr);
|
|
|
|
vector<tl_object_ptr<telegram_api::DocumentAttribute>> attributes;
|
|
auto suggested_video_note_length =
|
|
narrow_cast<int32>(td_->option_manager_->get_option_integer("suggested_video_note_length", 384));
|
|
attributes.push_back(make_tl_object<telegram_api::documentAttributeVideo>(
|
|
telegram_api::documentAttributeVideo::ROUND_MESSAGE_MASK, false /*ignored*/, false /*ignored*/,
|
|
video_note->duration, video_note->dimensions.width ? video_note->dimensions.width : suggested_video_note_length,
|
|
video_note->dimensions.height ? video_note->dimensions.height : suggested_video_note_length));
|
|
int32 flags = telegram_api::inputMediaUploadedDocument::NOSOUND_VIDEO_MASK;
|
|
if (input_thumbnail != nullptr) {
|
|
flags |= telegram_api::inputMediaUploadedDocument::THUMB_MASK;
|
|
}
|
|
return make_tl_object<telegram_api::inputMediaUploadedDocument>(
|
|
flags, false /*ignored*/, false /*ignored*/, false /*ignored*/, std::move(input_file),
|
|
std::move(input_thumbnail), "video/mp4", std::move(attributes),
|
|
vector<tl_object_ptr<telegram_api::InputDocument>>(), 0);
|
|
} else {
|
|
CHECK(!file_view.has_remote_location());
|
|
}
|
|
|
|
return nullptr;
|
|
}
|
|
|
|
} // namespace td
|