// // Copyright Aliaksei Levin (levlam@telegram.org), Arseny Smirnov (arseny30@gmail.com) 2014-2022 // // Distributed under the Boost Software License, Version 1.0. (See accompanying // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) // #include "td/telegram/VideoNotesManager.h" #include "td/telegram/AuthManager.h" #include "td/telegram/files/FileManager.h" #include "td/telegram/Global.h" #include "td/telegram/MessagesManager.h" #include "td/telegram/OptionManager.h" #include "td/telegram/PhotoFormat.h" #include "td/telegram/secret_api.h" #include "td/telegram/Td.h" #include "td/telegram/td_api.h" #include "td/telegram/telegram_api.h" #include "td/telegram/UpdatesManager.h" #include "td/actor/actor.h" #include "td/utils/buffer.h" #include "td/utils/logging.h" #include "td/utils/misc.h" #include "td/utils/Status.h" namespace td { VideoNotesManager::VideoNotesManager(Td *td, ActorShared<> parent) : td_(td), parent_(std::move(parent)) { } VideoNotesManager::~VideoNotesManager() { Scheduler::instance()->destroy_on_scheduler(G()->get_gc_scheduler_id(), video_notes_); } void VideoNotesManager::tear_down() { parent_.reset(); } int32 VideoNotesManager::get_video_note_duration(FileId file_id) const { auto video_note = get_video_note(file_id); CHECK(video_note != nullptr); return video_note->duration; } tl_object_ptr VideoNotesManager::get_video_note_object(FileId file_id) const { if (!file_id.is_valid()) { return nullptr; } auto video_note = get_video_note(file_id); auto speech_recognition_result = video_note->transcription_info == nullptr ? nullptr : video_note->transcription_info->get_speech_recognition_result_object(); return make_tl_object( video_note->duration, video_note->waveform, video_note->dimensions.width, get_minithumbnail_object(video_note->minithumbnail), get_thumbnail_object(td_->file_manager_.get(), video_note->thumbnail, PhotoFormat::Jpeg), std::move(speech_recognition_result), td_->file_manager_->get_file_object(file_id)); } FileId VideoNotesManager::on_get_video_note(unique_ptr new_video_note, bool replace) { auto file_id = new_video_note->file_id; CHECK(file_id.is_valid()); LOG(INFO) << "Receive video note " << file_id; auto &v = video_notes_[file_id]; if (v == nullptr) { v = std::move(new_video_note); } else if (replace) { CHECK(v->file_id == new_video_note->file_id); if (v->duration != new_video_note->duration || v->dimensions != new_video_note->dimensions || v->waveform != new_video_note->waveform) { LOG(DEBUG) << "Video note " << file_id << " info has changed"; v->duration = new_video_note->duration; v->dimensions = new_video_note->dimensions; v->waveform = std::move(new_video_note->waveform); } if (!G()->get_option_boolean("disable_minithumbnails")) { if (v->minithumbnail != new_video_note->minithumbnail) { v->minithumbnail = std::move(new_video_note->minithumbnail); } } if (v->thumbnail != new_video_note->thumbnail) { if (!v->thumbnail.file_id.is_valid()) { LOG(DEBUG) << "Video note " << file_id << " thumbnail has changed"; } else { LOG(INFO) << "Video note " << file_id << " thumbnail has changed from " << v->thumbnail << " to " << new_video_note->thumbnail; } v->thumbnail = std::move(new_video_note->thumbnail); } if (TranscriptionInfo::update_from(v->transcription_info, std::move(new_video_note->transcription_info))) { on_video_note_transcription_completed(file_id); } } return file_id; } VideoNotesManager::VideoNote *VideoNotesManager::get_video_note(FileId file_id) { return video_notes_.get_pointer(file_id); } const VideoNotesManager::VideoNote *VideoNotesManager::get_video_note(FileId file_id) const { return video_notes_.get_pointer(file_id); } FileId VideoNotesManager::get_video_note_thumbnail_file_id(FileId file_id) const { auto video_note = get_video_note(file_id); CHECK(video_note != nullptr); return video_note->thumbnail.file_id; } void VideoNotesManager::delete_video_note_thumbnail(FileId file_id) { auto &video_note = video_notes_[file_id]; CHECK(video_note != nullptr); video_note->thumbnail = PhotoSize(); } FileId VideoNotesManager::dup_video_note(FileId new_id, FileId old_id) { const VideoNote *old_video_note = get_video_note(old_id); CHECK(old_video_note != nullptr); auto &new_video_note = video_notes_[new_id]; CHECK(new_video_note == nullptr); new_video_note = make_unique(); new_video_note->file_id = new_id; new_video_note->duration = old_video_note->duration; new_video_note->dimensions = old_video_note->dimensions; new_video_note->waveform = old_video_note->waveform; new_video_note->minithumbnail = old_video_note->minithumbnail; new_video_note->thumbnail = old_video_note->thumbnail; new_video_note->thumbnail.file_id = td_->file_manager_->dup_file_id(new_video_note->thumbnail.file_id, "dup_video_note"); new_video_note->transcription_info = TranscriptionInfo::copy_if_transcribed(old_video_note->transcription_info); return new_id; } void VideoNotesManager::merge_video_notes(FileId new_id, FileId old_id) { CHECK(old_id.is_valid() && new_id.is_valid()); CHECK(new_id != old_id); LOG(INFO) << "Merge video notes " << new_id << " and " << old_id; const VideoNote *old_ = get_video_note(old_id); CHECK(old_ != nullptr); const auto *new_ = get_video_note(new_id); if (new_ == nullptr) { dup_video_note(new_id, old_id); } else { if (old_->thumbnail != new_->thumbnail) { // LOG_STATUS(td_->file_manager_->merge(new_->thumbnail.file_id, old_->thumbnail.file_id)); } } LOG_STATUS(td_->file_manager_->merge(new_id, old_id)); } void VideoNotesManager::create_video_note(FileId file_id, string minithumbnail, PhotoSize thumbnail, int32 duration, Dimensions dimensions, string waveform, bool replace) { auto v = make_unique(); v->file_id = file_id; v->duration = max(duration, 0); if (dimensions.width == dimensions.height && dimensions.width <= 640) { v->dimensions = dimensions; } else { LOG(INFO) << "Receive wrong video note dimensions " << dimensions; } v->waveform = std::move(waveform); if (!td_->auth_manager_->is_bot() && !G()->get_option_boolean("disable_minithumbnails")) { v->minithumbnail = std::move(minithumbnail); } v->thumbnail = std::move(thumbnail); on_get_video_note(std::move(v), replace); } void VideoNotesManager::register_video_note(FileId video_note_file_id, FullMessageId full_message_id, const char *source) { if (full_message_id.get_message_id().is_scheduled() || !full_message_id.get_message_id().is_server() || td_->auth_manager_->is_bot()) { return; } LOG(INFO) << "Register video note " << video_note_file_id << " from " << full_message_id << " from " << source; bool is_inserted = video_note_messages_[video_note_file_id].insert(full_message_id).second; LOG_CHECK(is_inserted) << source << ' ' << video_note_file_id << ' ' << full_message_id; is_inserted = message_video_notes_.emplace(full_message_id, video_note_file_id).second; CHECK(is_inserted); } void VideoNotesManager::unregister_video_note(FileId video_note_file_id, FullMessageId full_message_id, const char *source) { if (full_message_id.get_message_id().is_scheduled() || !full_message_id.get_message_id().is_server() || td_->auth_manager_->is_bot()) { return; } LOG(INFO) << "Unregister video note " << video_note_file_id << " from " << full_message_id << " from " << source; auto &message_ids = video_note_messages_[video_note_file_id]; auto is_deleted = message_ids.erase(full_message_id) > 0; LOG_CHECK(is_deleted) << source << ' ' << video_note_file_id << ' ' << full_message_id; if (message_ids.empty()) { video_note_messages_.erase(video_note_file_id); } is_deleted = message_video_notes_.erase(full_message_id) > 0; CHECK(is_deleted); } void VideoNotesManager::recognize_speech(FullMessageId full_message_id, Promise &&promise) { auto it = message_video_notes_.find(full_message_id); CHECK(it != message_video_notes_.end()); auto file_id = it->second; auto video_note = get_video_note(file_id); CHECK(video_note != nullptr); if (video_note->transcription_info == nullptr) { video_note->transcription_info = make_unique(); } auto handler = [actor_id = actor_id(this), file_id](Result> r_update) { send_closure(actor_id, &VideoNotesManager::on_transcribed_audio_update, file_id, true, std::move(r_update)); }; if (video_note->transcription_info->recognize_speech(td_, full_message_id, std::move(promise), std::move(handler))) { on_video_note_transcription_updated(file_id); } } void VideoNotesManager::on_transcribed_audio_update( FileId file_id, bool is_initial, Result> r_update) { if (G()->close_flag()) { return; } auto video_note = get_video_note(file_id); CHECK(video_note != nullptr); CHECK(video_note->transcription_info != nullptr); if (r_update.is_error()) { auto promises = video_note->transcription_info->on_failed_transcription(r_update.error().clone()); on_video_note_transcription_updated(file_id); fail_promises(promises, r_update.move_as_error()); return; } auto update = r_update.move_as_ok(); auto transcription_id = update->transcription_id_; if (!update->pending_) { auto promises = video_note->transcription_info->on_final_transcription(std::move(update->text_), transcription_id); on_video_note_transcription_completed(file_id); set_promises(promises); } else { auto is_changed = video_note->transcription_info->on_partial_transcription(std::move(update->text_), transcription_id); if (is_changed) { on_video_note_transcription_updated(file_id); } if (is_initial) { td_->updates_manager_->subscribe_to_transcribed_audio_updates( transcription_id, [actor_id = actor_id(this), file_id](Result> r_update) { send_closure(actor_id, &VideoNotesManager::on_transcribed_audio_update, file_id, false, std::move(r_update)); }); } } } void VideoNotesManager::on_video_note_transcription_updated(FileId file_id) { auto it = video_note_messages_.find(file_id); if (it != video_note_messages_.end()) { for (const auto &full_message_id : it->second) { td_->messages_manager_->on_external_update_message_content(full_message_id); } } } void VideoNotesManager::on_video_note_transcription_completed(FileId file_id) { auto it = video_note_messages_.find(file_id); if (it != video_note_messages_.end()) { for (const auto &full_message_id : it->second) { td_->messages_manager_->on_update_message_content(full_message_id); } } } void VideoNotesManager::rate_speech_recognition(FullMessageId full_message_id, bool is_good, Promise &&promise) { auto it = message_video_notes_.find(full_message_id); CHECK(it != message_video_notes_.end()); auto file_id = it->second; auto video_note = get_video_note(file_id); CHECK(video_note != nullptr); if (video_note->transcription_info == nullptr) { return promise.set_value(Unit()); } video_note->transcription_info->rate_speech_recognition(td_, full_message_id, is_good, std::move(promise)); } SecretInputMedia VideoNotesManager::get_secret_input_media(FileId video_note_file_id, tl_object_ptr input_file, BufferSlice thumbnail, int32 layer) const { const VideoNote *video_note = get_video_note(video_note_file_id); CHECK(video_note != nullptr); auto file_view = td_->file_manager_->get_file_view(video_note_file_id); if (!file_view.is_encrypted_secret() || file_view.encryption_key().empty()) { return SecretInputMedia{}; } if (file_view.has_remote_location()) { input_file = file_view.main_remote_location().as_input_encrypted_file(); } if (!input_file) { return SecretInputMedia{}; } if (video_note->thumbnail.file_id.is_valid() && thumbnail.empty()) { return SecretInputMedia{}; } vector> attributes; attributes.push_back(make_tl_object( secret_api::documentAttributeVideo::ROUND_MESSAGE_MASK, true, video_note->duration, video_note->dimensions.width, video_note->dimensions.height)); return {std::move(input_file), std::move(thumbnail), video_note->thumbnail.dimensions, "video/mp4", file_view, std::move(attributes), string(), layer}; } tl_object_ptr VideoNotesManager::get_input_media( FileId file_id, tl_object_ptr input_file, tl_object_ptr input_thumbnail) const { auto file_view = td_->file_manager_->get_file_view(file_id); if (file_view.is_encrypted()) { return nullptr; } if (file_view.has_remote_location() && !file_view.main_remote_location().is_web() && input_file == nullptr) { return make_tl_object(0, file_view.main_remote_location().as_input_document(), 0, string()); } if (file_view.has_url()) { return make_tl_object(0, file_view.url(), 0); } if (input_file != nullptr) { const VideoNote *video_note = get_video_note(file_id); CHECK(video_note != nullptr); vector> attributes; auto suggested_video_note_length = narrow_cast(td_->option_manager_->get_option_integer("suggested_video_note_length", 384)); attributes.push_back(make_tl_object( telegram_api::documentAttributeVideo::ROUND_MESSAGE_MASK, false /*ignored*/, false /*ignored*/, video_note->duration, video_note->dimensions.width ? video_note->dimensions.width : suggested_video_note_length, video_note->dimensions.height ? video_note->dimensions.height : suggested_video_note_length)); int32 flags = telegram_api::inputMediaUploadedDocument::NOSOUND_VIDEO_MASK; if (input_thumbnail != nullptr) { flags |= telegram_api::inputMediaUploadedDocument::THUMB_MASK; } return make_tl_object( flags, false /*ignored*/, false /*ignored*/, std::move(input_file), std::move(input_thumbnail), "video/mp4", std::move(attributes), vector>(), 0); } else { CHECK(!file_view.has_remote_location()); } return nullptr; } void VideoNotesManager::memory_stats(vector &output) { output.push_back("\"video_notes_\":"); output.push_back(std::to_string(video_notes_.size())); } } // namespace td